toilaluan committed on
Commit
b10d14c
·
verified ·
1 Parent(s): b7a708f

Training in progress, step 4500

Browse files
adapter_config.json CHANGED
@@ -1 +1,41 @@
1
- {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "DeepMount00/Llama-3-8b-Ita", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["o_proj", "gate_proj", "down_proj", "q_proj", "out_proj", "query_key_value", "up_proj", "k_proj", "v_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "DeepMount00/Llama-3-8b-Ita",
5
+ "bias": "none",
6
+ "corda_config": null,
7
+ "eva_config": null,
8
+ "exclude_modules": null,
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": true,
12
+ "layer_replication": null,
13
+ "layers_pattern": null,
14
+ "layers_to_transform": null,
15
+ "loftq_config": {},
16
+ "lora_alpha": 256,
17
+ "lora_bias": false,
18
+ "lora_dropout": 0.0,
19
+ "megatron_config": null,
20
+ "megatron_core": "megatron.core",
21
+ "modules_to_save": null,
22
+ "peft_type": "LORA",
23
+ "r": 128,
24
+ "rank_pattern": {},
25
+ "revision": null,
26
+ "target_modules": [
27
+ "v_proj",
28
+ "query_key_value",
29
+ "down_proj",
30
+ "out_proj",
31
+ "o_proj",
32
+ "k_proj",
33
+ "up_proj",
34
+ "q_proj",
35
+ "gate_proj"
36
+ ],
37
+ "task_type": "CAUSAL_LM",
38
+ "trainable_token_indices": null,
39
+ "use_dora": false,
40
+ "use_rslora": false
41
+ }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64b6aa33832d0d07d57dca4a7c2a8e07ac398948af54aebf07704d4493be1232
3
  size 1342238560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e829e2de319c5684041606ea3f279775eba97da5fcdedfe992d3078175bc1c14
3
  size 1342238560
toilaluan/bf0c13f3-6e2f-4cf7-aa39-cafe6a49051e/adapter_config.json CHANGED
@@ -1 +1 @@
1
- {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "DeepMount00/Llama-3-8b-Ita", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["out_proj", "o_proj", "v_proj", "down_proj", "q_proj", "k_proj", "query_key_value", "gate_proj", "up_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
 
1
+ {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "DeepMount00/Llama-3-8b-Ita", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["o_proj", "gate_proj", "down_proj", "q_proj", "out_proj", "query_key_value", "up_proj", "k_proj", "v_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a80339fd00b8c6ec910c51b16a50018434748ecd352a5c039889a20cc0403b69
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77addcdce5d8fbb4db14c5505c22819cb08647c68cb6e374bc0b2ad40062c025
3
  size 5752