Training in progress, step 1400
Browse files- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +4 -8
- training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -23,13 +23,13 @@
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
-
"q_proj",
|
27 |
-
"v_proj",
|
28 |
-
"o_proj",
|
29 |
-
"up_proj",
|
30 |
"k_proj",
|
31 |
"down_proj",
|
32 |
-
"
|
|
|
|
|
|
|
|
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
|
|
|
|
|
|
|
|
26 |
"k_proj",
|
27 |
"down_proj",
|
28 |
+
"v_proj",
|
29 |
+
"up_proj",
|
30 |
+
"o_proj",
|
31 |
+
"gate_proj",
|
32 |
+
"q_proj"
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 147770496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1615841c13c049e702c516acde8d23f94d7116112383ee44425bbf84b72e56d7
|
3 |
size 147770496
|
trainer_log.jsonl
CHANGED
@@ -1,8 +1,4 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps": 1330, "total_steps": 2553, "loss": 0.5151, "lr": 0.00014120290854186863, "epoch": 1.5627019089574157, "percentage": 52.1, "elapsed_time": "2:55:11", "remaining_time": "2:41:05"}
|
6 |
-
{"current_steps": 1340, "total_steps": 2553, "loss": 0.507, "lr": 0.00013935373390146634, "epoch": 1.5744493392070484, "percentage": 52.49, "elapsed_time": "3:30:20", "remaining_time": "3:10:24"}
|
7 |
-
{"current_steps": 1350, "total_steps": 2553, "loss": 0.4973, "lr": 0.00013750618405697912, "epoch": 1.5861967694566812, "percentage": 52.88, "elapsed_time": "4:05:30", "remaining_time": "3:38:46"}
|
8 |
-
{"current_steps": 1360, "total_steps": 2553, "loss": 0.5033, "lr": 0.0001356605409750058, "epoch": 1.5979441997063142, "percentage": 53.27, "elapsed_time": "4:40:38", "remaining_time": "4:06:11"}
|
|
|
1 |
+
{"current_steps": 1370, "total_steps": 2553, "loss": 0.5259, "lr": 0.0001340013252947644, "epoch": 1.6096916299559472, "percentage": 53.66, "elapsed_time": "0:34:02", "remaining_time": "0:29:23"}
|
2 |
+
{"current_steps": 1380, "total_steps": 2553, "loss": 0.5164, "lr": 0.00013216008080267535, "epoch": 1.6214390602055802, "percentage": 54.05, "elapsed_time": "1:08:10", "remaining_time": "0:57:57"}
|
3 |
+
{"current_steps": 1390, "total_steps": 2553, "loss": 0.5011, "lr": 0.0001303215589766901, "epoch": 1.633186490455213, "percentage": 54.45, "elapsed_time": "1:42:17", "remaining_time": "1:25:35"}
|
4 |
+
{"current_steps": 1400, "total_steps": 2553, "loss": 0.5096, "lr": 0.00012848604040558272, "epoch": 1.6449339207048457, "percentage": 54.84, "elapsed_time": "2:16:30", "remaining_time": "1:52:25"}
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5752
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4096d841cf7ca75806307b6c6b7d6fa53491e67ad1132e299019b216142f58b9
|
3 |
size 5752
|