Training in progress, step 240
Browse files
- adapter_config.json +4 -4
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +4 -20
- training_args.bin +2 -2
adapter_config.json
CHANGED
@@ -23,13 +23,13 @@
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
-
"k_proj",
|
27 |
"v_proj",
|
28 |
-
"gate_proj",
|
29 |
-
"up_proj",
|
30 |
"down_proj",
|
|
|
|
|
31 |
"o_proj",
|
32 |
-
"q_proj"
|
|
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
|
|
26 |
"v_proj",
|
|
|
|
|
27 |
"down_proj",
|
28 |
+
"q_proj",
|
29 |
+
"gate_proj",
|
30 |
"o_proj",
|
31 |
+
"up_proj",
|
32 |
+
"k_proj"
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 147770496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8f96b84f3521835e4c2e7bd5f9446c2060ce1c248af900530e1e084ead567ee
|
3 |
size 147770496
|
trainer_log.jsonl
CHANGED
@@ -1,20 +1,4 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps": 50, "total_steps": 851, "loss": 0.7685, "lr": 0.0002984109778320875, "epoch": 0.05873715124816446, "percentage": 5.88, "elapsed_time": "2:40:40", "remaining_time": "1 day, 18:54:06"}
|
6 |
-
{"current_steps": 60, "total_steps": 851, "loss": 0.7096, "lr": 0.00029749418918542057, "epoch": 0.07048458149779736, "percentage": 7.05, "elapsed_time": "3:12:51", "remaining_time": "1 day, 18:22:25"}
|
7 |
-
{"current_steps": 70, "total_steps": 851, "loss": 0.6901, "lr": 0.0002963716067978866, "epoch": 0.08223201174743025, "percentage": 8.23, "elapsed_time": "3:45:02", "remaining_time": "1 day, 17:50:45"}
|
8 |
-
{"current_steps": 80, "total_steps": 851, "loss": 0.6702, "lr": 0.000295044796971387, "epoch": 0.09397944199706314, "percentage": 9.4, "elapsed_time": "4:17:13", "remaining_time": "1 day, 17:18:56"}
|
9 |
-
{"current_steps": 90, "total_steps": 851, "loss": 0.6353, "lr": 0.000293515610959582, "epoch": 0.10572687224669604, "percentage": 10.58, "elapsed_time": "4:49:24", "remaining_time": "1 day, 16:47:10"}
|
10 |
-
{"current_steps": 100, "total_steps": 851, "loss": 0.6479, "lr": 0.0002917861823848985, "epoch": 0.11747430249632893, "percentage": 11.75, "elapsed_time": "5:21:32", "remaining_time": "1 day, 16:14:43"}
|
11 |
-
{"current_steps": 110, "total_steps": 851, "loss": 0.6244, "lr": 0.0002898589242615568, "epoch": 0.12922173274596183, "percentage": 12.93, "elapsed_time": "5:53:44", "remaining_time": "1 day, 15:42:52"}
|
12 |
-
{"current_steps": 120, "total_steps": 851, "loss": 0.6217, "lr": 0.0002877365256287728, "epoch": 0.14096916299559473, "percentage": 14.1, "elapsed_time": "6:25:57", "remaining_time": "1 day, 15:11:05"}
|
13 |
-
{"current_steps": 130, "total_steps": 851, "loss": 0.6022, "lr": 0.00028542194779883047, "epoch": 0.1527165932452276, "percentage": 15.28, "elapsed_time": "6:58:09", "remaining_time": "1 day, 14:39:12"}
|
14 |
-
{"current_steps": 140, "total_steps": 851, "loss": 0.6098, "lr": 0.00028291842022526133, "epoch": 0.1644640234948605, "percentage": 16.45, "elapsed_time": "7:30:23", "remaining_time": "1 day, 14:07:21"}
|
15 |
-
{"current_steps": 150, "total_steps": 851, "loss": 0.5971, "lr": 0.0002802294359968954, "epoch": 0.1762114537444934, "percentage": 17.63, "elapsed_time": "8:02:40", "remaining_time": "1 day, 13:35:40"}
|
16 |
-
{"current_steps": 160, "total_steps": 851, "loss": 0.5937, "lr": 0.0002773587469640702, "epoch": 0.18795888399412627, "percentage": 18.8, "elapsed_time": "8:34:53", "remaining_time": "1 day, 13:03:40"}
|
17 |
-
{"current_steps": 170, "total_steps": 851, "loss": 0.6054, "lr": 0.0002743103585037989, "epoch": 0.19970631424375918, "percentage": 19.98, "elapsed_time": "9:07:06", "remaining_time": "1 day, 12:31:40"}
|
18 |
-
{"current_steps": 180, "total_steps": 851, "loss": 0.5708, "lr": 0.0002710885239312008, "epoch": 0.21145374449339208, "percentage": 21.15, "elapsed_time": "9:39:20", "remaining_time": "1 day, 11:59:38"}
|
19 |
-
{"current_steps": 190, "total_steps": 851, "loss": 0.5806, "lr": 0.00026769773856499167, "epoch": 0.22320117474302498, "percentage": 22.33, "elapsed_time": "10:11:34", "remaining_time": "1 day, 11:27:38"}
|
20 |
-
{"current_steps": 200, "total_steps": 851, "loss": 0.5747, "lr": 0.0002641427334553158, "epoch": 0.23494860499265785, "percentage": 23.5, "elapsed_time": "10:43:48", "remaining_time": "1 day, 10:55:37"}
|
|
|
1 |
+
{"current_steps": 210, "total_steps": 851, "loss": 0.5879, "lr": 0.00026042846878266795, "epoch": 0.24669603524229075, "percentage": 24.68, "elapsed_time": "0:33:05", "remaining_time": "1:41:00"}
|
2 |
+
{"current_steps": 220, "total_steps": 851, "loss": 0.5852, "lr": 0.0002565601269371192, "epoch": 0.25844346549192365, "percentage": 25.85, "elapsed_time": "1:06:33", "remaining_time": "3:10:55"}
|
3 |
+
{"current_steps": 230, "total_steps": 851, "loss": 0.5605, "lr": 0.0002525431052874997, "epoch": 0.2701908957415565, "percentage": 27.03, "elapsed_time": "1:39:59", "remaining_time": "4:29:59"}
|
4 |
+
{"current_steps": 240, "total_steps": 851, "loss": 0.5738, "lr": 0.00024838300865062966, "epoch": 0.28193832599118945, "percentage": 28.2, "elapsed_time": "2:13:28", "remaining_time": "5:39:47"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8973bbd1b103ead50852e2b114af48d9e0d924c6ae8eab7404eef91ab656cddc
|
3 |
+
size 5752
|