sachin committed on
Commit
009e3ec
·
verified ·
1 Parent(s): 0670e66

2024-12-18-15-38-01

Browse files
README.md CHANGED
@@ -34,16 +34,20 @@ More information needed
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0001
37
- - train_batch_size: 8
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - gradient_accumulation_steps: 2
41
- - total_train_batch_size: 16
42
  - optimizer: Use paged_adamw_8bit with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - lr_scheduler_warmup_steps: 50
45
  - num_epochs: 2
46
 
 
 
 
 
47
  ### Framework versions
48
 
49
  - PEFT 0.14.0
 
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0001
37
+ - train_batch_size: 4
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - gradient_accumulation_steps: 2
41
+ - total_train_batch_size: 8
42
  - optimizer: Use paged_adamw_8bit with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - lr_scheduler_warmup_steps: 50
45
  - num_epochs: 2
46
 
47
+ ### Training results
48
+
49
+
50
+
51
  ### Framework versions
52
 
53
  - PEFT 0.14.0
adapter_config.json CHANGED
@@ -27,12 +27,12 @@
27
  "revision": null,
28
  "target_modules": [
29
  "gate_proj",
30
- "up_proj",
31
- "o_proj",
32
  "down_proj",
33
- "q_proj",
34
  "k_proj",
35
- "v_proj"
 
36
  ],
37
  "task_type": null,
38
  "use_dora": false,
 
27
  "revision": null,
28
  "target_modules": [
29
  "gate_proj",
30
+ "v_proj",
 
31
  "down_proj",
32
+ "up_proj",
33
  "k_proj",
34
+ "q_proj",
35
+ "o_proj"
36
  ],
37
  "task_type": null,
38
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0de7981adf78b5cd6fec87b9b8f63414eaa767187d209eb18994a368160042f
3
  size 36981072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e78360308a1be6d34038ca06da6156096c5095c08ce35657a6066df431458a00
3
  size 36981072
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9128f85f4032d1e8e8949c41b05e5aa0303cf4010c2ed2dd7ab32649ac7e4c0c
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d680724ae53cf05e4f8c3d0264c79a9fe57361214e446256c8d3759b9286cb09
3
  size 5368