Training in progress, step 2120
Browse files
- adapter_config.json +4 -4
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +4 -20
- training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -23,13 +23,13 @@
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
-
"down_proj",
|
27 |
-
"o_proj",
|
28 |
-
"gate_proj",
|
29 |
"k_proj",
|
30 |
"up_proj",
|
31 |
"v_proj",
|
32 |
-
"q_proj"
|
|
|
|
|
|
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
|
|
|
|
|
|
26 |
"k_proj",
|
27 |
"up_proj",
|
28 |
"v_proj",
|
29 |
+
"o_proj",
|
30 |
+
"down_proj",
|
31 |
+
"q_proj",
|
32 |
+
"gate_proj"
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 147770496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:788640632106b240e696686df5a835b0ed2407a7d55b40141baf52d658a52e52
|
3 |
size 147770496
|
trainer_log.jsonl
CHANGED
@@ -1,20 +1,4 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps": 1930, "total_steps": 2553, "loss": 0.4768, "lr": 4.253477570863275e-05, "epoch": 2.2678414096916297, "percentage": 75.6, "elapsed_time": "2:46:00", "remaining_time": "0:53:35"}
|
6 |
-
{"current_steps": 1940, "total_steps": 2553, "loss": 0.4915, "lr": 4.1250198564289644e-05, "epoch": 2.2795888399412627, "percentage": 75.99, "elapsed_time": "3:19:18", "remaining_time": "1:02:58"}
|
7 |
-
{"current_steps": 1950, "total_steps": 2553, "loss": 0.4773, "lr": 3.998221843447808e-05, "epoch": 2.2913362701908957, "percentage": 76.38, "elapsed_time": "3:52:20", "remaining_time": "1:11:50"}
|
8 |
-
{"current_steps": 1960, "total_steps": 2553, "loss": 0.4728, "lr": 3.8731028833892955e-05, "epoch": 2.3030837004405287, "percentage": 76.77, "elapsed_time": "4:25:08", "remaining_time": "1:20:13"}
|
9 |
-
{"current_steps": 1970, "total_steps": 2553, "loss": 0.4978, "lr": 3.749682071471727e-05, "epoch": 2.3148311306901617, "percentage": 77.16, "elapsed_time": "4:58:14", "remaining_time": "1:28:15"}
|
10 |
-
{"current_steps": 1980, "total_steps": 2553, "loss": 0.491, "lr": 3.627978243747965e-05, "epoch": 2.3265785609397946, "percentage": 77.56, "elapsed_time": "5:31:32", "remaining_time": "1:35:56"}
|
11 |
-
{"current_steps": 1990, "total_steps": 2553, "loss": 0.4672, "lr": 3.5080099742307495e-05, "epoch": 2.338325991189427, "percentage": 77.95, "elapsed_time": "6:04:49", "remaining_time": "1:43:12"}
|
12 |
-
{"current_steps": 2000, "total_steps": 2553, "loss": 0.4856, "lr": 3.3897955720579985e-05, "epoch": 2.35007342143906, "percentage": 78.34, "elapsed_time": "6:38:07", "remaining_time": "1:50:05"}
|
13 |
-
{"current_steps": 2010, "total_steps": 2553, "loss": 0.4893, "lr": 3.2733530786985124e-05, "epoch": 2.361820851688693, "percentage": 78.73, "elapsed_time": "7:11:25", "remaining_time": "1:56:32"}
|
14 |
-
{"current_steps": 2020, "total_steps": 2553, "loss": 0.4737, "lr": 3.1587002651985776e-05, "epoch": 2.373568281938326, "percentage": 79.12, "elapsed_time": "7:44:36", "remaining_time": "2:02:35"}
|
15 |
-
{"current_steps": 2030, "total_steps": 2553, "loss": 0.4883, "lr": 3.0458546294697954e-05, "epoch": 2.3853157121879587, "percentage": 79.51, "elapsed_time": "8:17:53", "remaining_time": "2:08:16"}
|
16 |
-
{"current_steps": 2040, "total_steps": 2553, "loss": 0.4761, "lr": 2.9348333936186003e-05, "epoch": 2.3970631424375917, "percentage": 79.91, "elapsed_time": "8:51:08", "remaining_time": "2:13:33"}
|
17 |
-
{"current_steps": 2050, "total_steps": 2553, "loss": 0.4867, "lr": 2.82565350131791e-05, "epoch": 2.4088105726872246, "percentage": 80.3, "elapsed_time": "9:24:22", "remaining_time": "2:18:28"}
|
18 |
-
{"current_steps": 2060, "total_steps": 2553, "loss": 0.4759, "lr": 2.718331615221218e-05, "epoch": 2.4205580029368576, "percentage": 80.69, "elapsed_time": "9:57:12", "remaining_time": "2:22:55"}
|
19 |
-
{"current_steps": 2070, "total_steps": 2553, "loss": 0.4881, "lr": 2.61288411441961e-05, "epoch": 2.4323054331864906, "percentage": 81.08, "elapsed_time": "10:30:13", "remaining_time": "2:27:03"}
|
20 |
-
{"current_steps": 2080, "total_steps": 2553, "loss": 0.4973, "lr": 2.5093270919420383e-05, "epoch": 2.444052863436123, "percentage": 81.47, "elapsed_time": "11:03:02", "remaining_time": "2:30:46"}
|
|
|
1 |
+
{"current_steps": 2090, "total_steps": 2553, "loss": 0.4887, "lr": 2.4076763522992665e-05, "epoch": 2.455800293685756, "percentage": 81.86, "elapsed_time": "0:28:01", "remaining_time": "0:06:12"}
|
2 |
+
{"current_steps": 2100, "total_steps": 2553, "loss": 0.4791, "lr": 2.307947409071825e-05, "epoch": 2.467547723935389, "percentage": 82.26, "elapsed_time": "0:56:03", "remaining_time": "0:12:05"}
|
3 |
+
{"current_steps": 2110, "total_steps": 2553, "loss": 0.4822, "lr": 2.210155482542402e-05, "epoch": 2.479295154185022, "percentage": 82.65, "elapsed_time": "1:24:06", "remaining_time": "0:17:39"}
|
4 |
+
{"current_steps": 2120, "total_steps": 2553, "loss": 0.4776, "lr": 2.1143154973729735e-05, "epoch": 2.491042584434655, "percentage": 83.04, "elapsed_time": "1:52:11", "remaining_time": "0:22:54"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5752
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f37c4f9def600a9e6150e724b6c67a6e551e6b342060fe9dc2e069df8930045
|
3 |
size 5752
|