hivetechVN committed on
Commit
eebb028
·
verified ·
1 Parent(s): d0b8f4a

End of training

Browse files
README.md CHANGED
@@ -36,8 +36,8 @@ This model was trained with SFT.
36
 
37
  - TRL: 0.15.1
38
  - Transformers: 4.49.0
39
- - Pytorch: 2.4.1+cu121
40
- - Datasets: 3.2.0
41
  - Tokenizers: 0.21.0
42
 
43
  ## Citations
 
36
 
37
  - TRL: 0.15.1
38
  - Transformers: 4.49.0
39
+ - Pytorch: 2.5.1+cu121
40
+ - Datasets: 3.3.1
41
  - Tokenizers: 0.21.0
42
 
43
  ## Citations
adapter_config.json CHANGED
@@ -12,22 +12,22 @@
12
  "layers_pattern": null,
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
- "lora_alpha": 32,
16
  "lora_bias": false,
17
  "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
- "r": 8,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "q_proj",
27
- "v_proj",
28
- "gate_proj",
29
  "o_proj",
30
  "k_proj",
 
 
 
31
  "up_proj",
32
  "down_proj"
33
  ],
 
12
  "layers_pattern": null,
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
+ "lora_alpha": 8,
16
  "lora_bias": false,
17
  "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
+ "r": 16,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
26
  "o_proj",
27
  "k_proj",
28
+ "gate_proj",
29
+ "q_proj",
30
+ "v_proj",
31
  "up_proj",
32
  "down_proj"
33
  ],
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2f7aac257193429b2d0b249169272f4779908ca9c4c180572b7007f44ab8e80
3
- size 48679352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f18a823d269720f308bd71bfb4672017bd2cb2254c4d393036c1fbbe1aa4a89
3
+ size 97307544
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bff0889f4e69961d2cfe60b76d01f2cc8932e1251c18f43875d3cfce5e9bee1a
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:986b67fd0aedf9101749792ccb23747b957837b5e8ed1d458a996e48342f7a3d
3
  size 5624