m-nzr committed on
Commit
658638f
·
verified ·
1 Parent(s): 3f7736d

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -14,25 +14,17 @@
14
  "loftq_config": {},
15
  "lora_alpha": 16,
16
  "lora_bias": false,
17
- "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
- "modules_to_save": [
21
- "lm_head",
22
- "embed_tokens"
23
- ],
24
  "peft_type": "LORA",
25
- "r": 16,
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
- "o_proj",
30
- "gate_proj",
31
- "q_proj",
32
  "v_proj",
33
- "down_proj",
34
- "up_proj",
35
- "k_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "use_dora": false,
 
14
  "loftq_config": {},
15
  "lora_alpha": 16,
16
  "lora_bias": false,
17
+ "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
+ "modules_to_save": null,
 
 
 
21
  "peft_type": "LORA",
22
+ "r": 8,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
26
  "v_proj",
27
+ "q_proj"
 
 
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c7aa6805a20957ebec1a52bc24543392d8141dd70480a2387939eac0fcd5e94
3
- size 2468152240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06562ceb5a9d97f0ebbf2d49a44645ec057282f23bee2e11575e5c752c22157e
3
+ size 2995512
runs/Jun05_08-19-14_a1ca53c52470/events.out.tfevents.1749111773.a1ca53c52470.267.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7748b9beb16d190efd788bd5584066fe3a894ea8884b30c0814150f0f6f3f6e
3
+ size 12698
tokenizer_config.json CHANGED
@@ -51325,7 +51325,7 @@
51325
  },
51326
  "boi_token": "<start_of_image>",
51327
  "bos_token": "<bos>",
51328
- "chat_template": "{{ bos_token }}\n{%- if messages[0]['role'] == 'system' -%}\n {%- if messages[0]['content'] is string -%}\n {%- set first_user_prefix = messages[0]['content'] + '\n\n' -%}\n {%- else -%}\n {%- set first_user_prefix = messages[0]['content'][0]['text'] + '\n\n' -%}\n {%- endif -%}\n {%- set loop_messages = messages[1:] -%}\n{%- else -%}\n {%- set first_user_prefix = \"\" -%}\n {%- set loop_messages = messages -%}\n{%- endif -%}\n{%- for message in loop_messages -%}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}\n {{ raise_exception(\"Conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif -%}\n {%- if (message['role'] == 'assistant') -%}\n {%- set role = \"model\" -%}\n {%- else -%}\n {%- set role = message['role'] -%}\n {%- endif -%}\n {{ '<start_of_turn>' + role + '\n' + (first_user_prefix if loop.first else \"\") }}\n {%- if message['content'] is string -%}\n {{ message['content'] | trim }}\n {%- elif message['content'] is iterable -%}\n {%- for item in message['content'] -%}\n {%- if item['type'] == 'image' -%}\n {{ '<start_of_image>' }}\n {%- elif item['type'] == 'text' -%}\n {{ item['text'] | trim }}\n {%- endif -%}\n {%- endfor -%}\n {%- else -%}\n {{ raise_exception(\"Invalid content type\") }}\n {%- endif -%}\n {{ '<end_of_turn>\n' }}\n{%- endfor -%}\n{%- if add_generation_prompt -%}\n {{'<start_of_turn>model\n'}}\n{%- endif -%}\n",
51329
  "clean_up_tokenization_spaces": false,
51330
  "eoi_token": "<end_of_image>",
51331
  "eos_token": "<eos>",
 
51325
  },
51326
  "boi_token": "<start_of_image>",
51327
  "bos_token": "<bos>",
51328
+ "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}<start_of_turn>system\n{{ message['content'] }}<end_of_turn>\n{% elif message['role'] == 'user' %}<start_of_turn>user\n{{ message['content'] }}<end_of_turn>\n{% elif message['role'] == 'assistant' %}<start_of_turn>model\n{{ message['content'] }}<end_of_turn>\n{% endif %}{% endfor %}",
51329
  "clean_up_tokenization_spaces": false,
51330
  "eoi_token": "<end_of_image>",
51331
  "eos_token": "<eos>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:565bc04f7c093d29b82670fe6b634f2ccfffc247f4cddd5129dc04c9a9bc745d
3
  size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8dc3a2faa9bddaddb97efdc13c0d54db0a2d5bc563c12a321be9b147ba07fd
3
  size 5688