Training in progress, step 510
Browse files
model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5000000704
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67d2d85758228e26293a147261eeed022a0713ab01f1b86e93758a1f068ec8f8
|
3 |
size 5000000704
|
model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4857411192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b1037a778f3b065b19e19ec0a44008768f77ba149986ae1149e127697dfd51c
|
3 |
size 4857411192
|
model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3921970888
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8306211928142112e2074094fca257a6af3d70d16cf1be2a3f4bea74bd8d4aef
|
3 |
size 3921970888
|
trainer_log.jsonl
CHANGED
@@ -508,3 +508,33 @@
|
|
508 |
{"current_steps": 508, "total_steps": 9875, "loss": 0.9558, "lr": 5.1417004048583e-06, "epoch": 0.25721518987341774, "percentage": 5.14, "elapsed_time": "1:26:10", "remaining_time": "1 day, 2:28:58"}
|
509 |
{"current_steps": 509, "total_steps": 9875, "loss": 1.0187, "lr": 5.151821862348178e-06, "epoch": 0.25772151898734175, "percentage": 5.15, "elapsed_time": "1:26:12", "remaining_time": "1 day, 2:26:11"}
|
510 |
{"current_steps": 510, "total_steps": 9875, "loss": 1.069, "lr": 5.1619433198380576e-06, "epoch": 0.2582278481012658, "percentage": 5.16, "elapsed_time": "1:26:13", "remaining_time": "1 day, 2:23:23"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
508 |
{"current_steps": 508, "total_steps": 9875, "loss": 0.9558, "lr": 5.1417004048583e-06, "epoch": 0.25721518987341774, "percentage": 5.14, "elapsed_time": "1:26:10", "remaining_time": "1 day, 2:28:58"}
|
509 |
{"current_steps": 509, "total_steps": 9875, "loss": 1.0187, "lr": 5.151821862348178e-06, "epoch": 0.25772151898734175, "percentage": 5.15, "elapsed_time": "1:26:12", "remaining_time": "1 day, 2:26:11"}
|
510 |
{"current_steps": 510, "total_steps": 9875, "loss": 1.069, "lr": 5.1619433198380576e-06, "epoch": 0.2582278481012658, "percentage": 5.16, "elapsed_time": "1:26:13", "remaining_time": "1 day, 2:23:23"}
|
511 |
+
{"current_steps": 511, "total_steps": 9875, "loss": 0.9909, "lr": 5.172064777327935e-06, "epoch": 0.2587341772151899, "percentage": 5.17, "elapsed_time": "1:27:36", "remaining_time": "1 day, 2:45:16"}
|
512 |
+
{"current_steps": 512, "total_steps": 9875, "loss": 1.0835, "lr": 5.1821862348178145e-06, "epoch": 0.25924050632911394, "percentage": 5.18, "elapsed_time": "1:27:37", "remaining_time": "1 day, 2:42:27"}
|
513 |
+
{"current_steps": 513, "total_steps": 9875, "loss": 1.0285, "lr": 5.192307692307693e-06, "epoch": 0.25974683544303795, "percentage": 5.19, "elapsed_time": "1:27:39", "remaining_time": "1 day, 2:39:38"}
|
514 |
+
{"current_steps": 514, "total_steps": 9875, "loss": 0.9788, "lr": 5.202429149797571e-06, "epoch": 0.260253164556962, "percentage": 5.21, "elapsed_time": "1:27:40", "remaining_time": "1 day, 2:36:50"}
|
515 |
+
{"current_steps": 515, "total_steps": 9875, "loss": 1.0412, "lr": 5.21255060728745e-06, "epoch": 0.2607594936708861, "percentage": 5.22, "elapsed_time": "1:27:42", "remaining_time": "1 day, 2:34:05"}
|
516 |
+
{"current_steps": 516, "total_steps": 9875, "loss": 1.0391, "lr": 5.222672064777329e-06, "epoch": 0.26126582278481014, "percentage": 5.23, "elapsed_time": "1:27:44", "remaining_time": "1 day, 2:31:18"}
|
517 |
+
{"current_steps": 517, "total_steps": 9875, "loss": 0.9375, "lr": 5.232793522267207e-06, "epoch": 0.26177215189873415, "percentage": 5.24, "elapsed_time": "1:27:45", "remaining_time": "1 day, 2:28:32"}
|
518 |
+
{"current_steps": 518, "total_steps": 9875, "loss": 1.0521, "lr": 5.242914979757085e-06, "epoch": 0.2622784810126582, "percentage": 5.25, "elapsed_time": "1:27:47", "remaining_time": "1 day, 2:25:46"}
|
519 |
+
{"current_steps": 519, "total_steps": 9875, "loss": 1.126, "lr": 5.253036437246965e-06, "epoch": 0.2627848101265823, "percentage": 5.26, "elapsed_time": "1:27:48", "remaining_time": "1 day, 2:23:02"}
|
520 |
+
{"current_steps": 520, "total_steps": 9875, "loss": 1.0252, "lr": 5.263157894736842e-06, "epoch": 0.26329113924050634, "percentage": 5.27, "elapsed_time": "1:27:50", "remaining_time": "1 day, 2:20:18"}
|
521 |
+
{"current_steps": 521, "total_steps": 9875, "loss": 1.0089, "lr": 5.2732793522267215e-06, "epoch": 0.26379746835443035, "percentage": 5.28, "elapsed_time": "1:29:00", "remaining_time": "1 day, 2:38:03"}
|
522 |
+
{"current_steps": 522, "total_steps": 9875, "loss": 1.1345, "lr": 5.2834008097166e-06, "epoch": 0.2643037974683544, "percentage": 5.29, "elapsed_time": "1:29:02", "remaining_time": "1 day, 2:35:17"}
|
523 |
+
{"current_steps": 523, "total_steps": 9875, "loss": 0.9995, "lr": 5.293522267206478e-06, "epoch": 0.2648101265822785, "percentage": 5.3, "elapsed_time": "1:29:03", "remaining_time": "1 day, 2:32:33"}
|
524 |
+
{"current_steps": 524, "total_steps": 9875, "loss": 0.9631, "lr": 5.303643724696357e-06, "epoch": 0.26531645569620255, "percentage": 5.31, "elapsed_time": "1:29:05", "remaining_time": "1 day, 2:29:49"}
|
525 |
+
{"current_steps": 525, "total_steps": 9875, "loss": 1.0409, "lr": 5.313765182186235e-06, "epoch": 0.26582278481012656, "percentage": 5.32, "elapsed_time": "1:29:06", "remaining_time": "1 day, 2:27:05"}
|
526 |
+
{"current_steps": 526, "total_steps": 9875, "loss": 1.0228, "lr": 5.323886639676114e-06, "epoch": 0.2663291139240506, "percentage": 5.33, "elapsed_time": "1:29:08", "remaining_time": "1 day, 2:24:22"}
|
527 |
+
{"current_steps": 527, "total_steps": 9875, "loss": 1.0736, "lr": 5.334008097165992e-06, "epoch": 0.2668354430379747, "percentage": 5.34, "elapsed_time": "1:29:10", "remaining_time": "1 day, 2:21:40"}
|
528 |
+
{"current_steps": 528, "total_steps": 9875, "loss": 1.0613, "lr": 5.344129554655872e-06, "epoch": 0.26734177215189875, "percentage": 5.35, "elapsed_time": "1:29:11", "remaining_time": "1 day, 2:18:58"}
|
529 |
+
{"current_steps": 529, "total_steps": 9875, "loss": 1.0405, "lr": 5.354251012145749e-06, "epoch": 0.26784810126582276, "percentage": 5.36, "elapsed_time": "1:29:13", "remaining_time": "1 day, 2:16:17"}
|
530 |
+
{"current_steps": 530, "total_steps": 9875, "loss": 1.0296, "lr": 5.364372469635628e-06, "epoch": 0.2683544303797468, "percentage": 5.37, "elapsed_time": "1:29:14", "remaining_time": "1 day, 2:13:36"}
|
531 |
+
{"current_steps": 531, "total_steps": 9875, "loss": 1.0532, "lr": 5.374493927125507e-06, "epoch": 0.2688607594936709, "percentage": 5.38, "elapsed_time": "1:30:20", "remaining_time": "1 day, 2:29:44"}
|
532 |
+
{"current_steps": 532, "total_steps": 9875, "loss": 1.0248, "lr": 5.384615384615385e-06, "epoch": 0.26936708860759495, "percentage": 5.39, "elapsed_time": "1:30:22", "remaining_time": "1 day, 2:27:03"}
|
533 |
+
{"current_steps": 533, "total_steps": 9875, "loss": 1.2742, "lr": 5.394736842105264e-06, "epoch": 0.26987341772151896, "percentage": 5.4, "elapsed_time": "1:30:23", "remaining_time": "1 day, 2:24:22"}
|
534 |
+
{"current_steps": 534, "total_steps": 9875, "loss": 1.0865, "lr": 5.4048582995951424e-06, "epoch": 0.270379746835443, "percentage": 5.41, "elapsed_time": "1:30:25", "remaining_time": "1 day, 2:21:41"}
|
535 |
+
{"current_steps": 535, "total_steps": 9875, "loss": 1.0238, "lr": 5.41497975708502e-06, "epoch": 0.2708860759493671, "percentage": 5.42, "elapsed_time": "1:30:26", "remaining_time": "1 day, 2:19:01"}
|
536 |
+
{"current_steps": 536, "total_steps": 9875, "loss": 0.9916, "lr": 5.425101214574899e-06, "epoch": 0.27139240506329115, "percentage": 5.43, "elapsed_time": "1:30:28", "remaining_time": "1 day, 2:16:22"}
|
537 |
+
{"current_steps": 537, "total_steps": 9875, "loss": 1.1823, "lr": 5.435222672064779e-06, "epoch": 0.27189873417721516, "percentage": 5.44, "elapsed_time": "1:30:30", "remaining_time": "1 day, 2:13:43"}
|
538 |
+
{"current_steps": 538, "total_steps": 9875, "loss": 1.0289, "lr": 5.445344129554656e-06, "epoch": 0.2724050632911392, "percentage": 5.45, "elapsed_time": "1:30:31", "remaining_time": "1 day, 2:11:05"}
|
539 |
+
{"current_steps": 539, "total_steps": 9875, "loss": 1.0893, "lr": 5.455465587044535e-06, "epoch": 0.2729113924050633, "percentage": 5.46, "elapsed_time": "1:30:33", "remaining_time": "1 day, 2:08:28"}
|
540 |
+
{"current_steps": 540, "total_steps": 9875, "loss": 1.1109, "lr": 5.465587044534414e-06, "epoch": 0.27341772151898736, "percentage": 5.47, "elapsed_time": "1:30:34", "remaining_time": "1 day, 2:05:51"}
|