Training in progress, step 100

Browse files

Files changed (10) hide show

README.md +4 -4
adapter_config.json +4 -4
adapter_model.safetensors +2 -2
chat_template.jinja +4 -47
runs/Oct25_18-48-25_afc9ba227e8c/events.out.tfevents.1761418110.afc9ba227e8c.4998.0 +3 -0
special_tokens_map.json +4 -3
tokenizer.json +2 -2
tokenizer.model +2 -2
tokenizer_config.json +0 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,17 +1,17 @@
 ---
-base_model: google/gemma-3-1b-it
 library_name: transformers
 model_name: Quotes_Generator
 tags:
 - generated_from_trainer
-- trl
 - sft
 licence: license
 ---
 # Model Card for Quotes_Generator
-This model is a fine-tuned version of [google/gemma-3-1b-it](https://huggingface.co/google/gemma-3-1b-it).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/not-lain/huggingface/runs/16bwzxjk)
 This model was trained with SFT.

 ---
+base_model: google/gemma-2b-it
 library_name: transformers
 model_name: Quotes_Generator
 tags:
 - generated_from_trainer
 - sft
+- trl
 licence: license
 ---
 # Model Card for Quotes_Generator
+This model is a fine-tuned version of [google/gemma-2b-it](https://huggingface.co/google/gemma-2b-it).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/not-lain/huggingface/runs/3ddd7vxd)
 This model was trained with SFT.

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "google/gemma-3-1b-it",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
@@ -25,12 +25,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
     "o_proj",
     "down_proj",
-    "q_proj",
     "v_proj",
-    "gate_proj",
     "up_proj"
   ],
   "target_parameters": null,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "google/gemma-2b-it",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
     "o_proj",
+    "gate_proj",
     "down_proj",
     "v_proj",
+    "k_proj",
     "up_proj"
   ],
   "target_parameters": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:684fd7ad6b94d5dffa2870e75b48534f34b74495df45687e03adb6e7345bcf96
-size 26139264

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4b08564ae986eada55bcbbc877876b78e6b7b9f98be533f53c5b84a8ba55964
+size 39256456

chat_template.jinja CHANGED Viewed

@@ -1,47 +1,4 @@
-{{ bos_token }}
-{%- if messages[0]['role'] == 'system' -%}
-    {%- if messages[0]['content'] is string -%}
-        {%- set first_user_prefix = messages[0]['content'] + '
-' -%}
-    {%- else -%}
-        {%- set first_user_prefix = messages[0]['content'][0]['text'] + '
-' -%}
-    {%- endif -%}
-    {%- set loop_messages = messages[1:] -%}
-{%- else -%}
-    {%- set first_user_prefix = "" -%}
-    {%- set loop_messages = messages -%}
-{%- endif -%}
-{%- for message in loop_messages -%}
-    {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}
-        {{ raise_exception("Conversation roles must alternate user/assistant/user/assistant/...") }}
-    {%- endif -%}
-    {%- if (message['role'] == 'assistant') -%}
-        {%- set role = "model" -%}
-    {%- else -%}
-        {%- set role = message['role'] -%}
-    {%- endif -%}
-    {{ '<start_of_turn>' + role + '
-' + (first_user_prefix if loop.first else "") }}
-    {%- if message['content'] is string -%}
-        {{ message['content'] | trim }}
-    {%- elif message['content'] is iterable -%}
-        {%- for item in message['content'] -%}
-            {%- if item['type'] == 'image' -%}
-                {{ '<start_of_image>' }}
-            {%- elif item['type'] == 'text' -%}
-                {{ item['text'] | trim }}
-            {%- endif -%}
-        {%- endfor -%}
-    {%- else -%}
-        {{ raise_exception("Invalid content type") }}
-    {%- endif -%}
-    {{ '<end_of_turn>
-' }}
-{%- endfor -%}
-{%- if add_generation_prompt -%}
-    {{'<start_of_turn>model
-'}}
-{%- endif -%}

+{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '
+' + message['content'] | trim + '<end_of_turn>
+' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model
+'}}{% endif %}

runs/Oct25_18-48-25_afc9ba227e8c/events.out.tfevents.1761418110.afc9ba227e8c.4998.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:782ee83a6f144885f5576452df4f60c9476d97553d7b8148de7dc1a60340943e
+size 43844

special_tokens_map.json CHANGED Viewed

@@ -1,5 +1,8 @@
 {
-  "boi_token": "<start_of_image>",
   "bos_token": {
     "content": "<bos>",
     "lstrip": false,
@@ -7,7 +10,6 @@
     "rstrip": false,
     "single_word": false
   },
-  "eoi_token": "<end_of_image>",
   "eos_token": {
     "content": "<eos>",
     "lstrip": false,
@@ -15,7 +17,6 @@
     "rstrip": false,
     "single_word": false
   },
-  "image_token": "<image_soft_token>",
   "pad_token": {
     "content": "<pad>",
     "lstrip": false,

 {
+  "additional_special_tokens": [
+    "<start_of_turn>",
+    "<end_of_turn>"
+  ],
   "bos_token": {
     "content": "<bos>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
   "eos_token": {
     "content": "<eos>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
   "pad_token": {
     "content": "<pad>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4667f2089529e8e7657cfb6d1c19910ae71ff5f28aa7ab2ff2763330affad795
-size 33384568

 version https://git-lfs.github.com/spec/v1
+oid sha256:f559f2189f392b4555613965f089e7c4d300b41fbe080bf79da0d676e33ee7f0
+size 34356041

tokenizer.model CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
-size 4689074

 version https://git-lfs.github.com/spec/v1
+oid sha256:61a7b147390c64585d6c3543dd6fc636906c9af3865a5548f27f31aee1d4c8e2
+size 4241003

tokenizer_config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70e1a64099f950635da1660f6a046f9e158a52e04beb0051ef2ab9f1056e411a
 size 6225

 version https://git-lfs.github.com/spec/v1
+oid sha256:76cb0ee7d8022d5c3acd59155caf6eb30b56d07b77fff110942b24d07e291db2
 size 6225