Training in progress, step 750
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34d3f8c2e71532662ea56e3ab463b51e70826ab34095977f9a31251797e6eb34
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e805d58b57c3b66882904f3dcef86fe6595b7d7f1e817ed5cfc893ef0b7c66af
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d0bbb1c7380d833e01c76c33fc472277768ec40a718ff6d6d93a626ab30434a
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1164805d08b40dcc8ad1cac56e5380ce388e7f4bcd0eba196676086963bbe137
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -58,3 +58,19 @@
|
|
58 |
{"current_steps": 580, "total_steps": 750, "loss": 0.26, "lr": 1.4850947128716914e-06, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "1 day, 11:02:45", "remaining_time": "10:16:19"}
|
59 |
{"current_steps": 590, "total_steps": 750, "loss": 0.258, "lr": 1.3234549597008572e-06, "epoch": 2.36, "percentage": 78.67, "elapsed_time": "1 day, 11:38:54", "remaining_time": "9:40:02"}
|
60 |
{"current_steps": 600, "total_steps": 750, "loss": 0.2637, "lr": 1.1697777844051105e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1 day, 12:14:51", "remaining_time": "9:03:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
58 |
{"current_steps": 580, "total_steps": 750, "loss": 0.26, "lr": 1.4850947128716914e-06, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "1 day, 11:02:45", "remaining_time": "10:16:19"}
|
59 |
{"current_steps": 590, "total_steps": 750, "loss": 0.258, "lr": 1.3234549597008572e-06, "epoch": 2.36, "percentage": 78.67, "elapsed_time": "1 day, 11:38:54", "remaining_time": "9:40:02"}
|
60 |
{"current_steps": 600, "total_steps": 750, "loss": 0.2637, "lr": 1.1697777844051105e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1 day, 12:14:51", "remaining_time": "9:03:42"}
|
61 |
+
{"current_steps": 610, "total_steps": 750, "loss": 0.2655, "lr": 1.0243960175257605e-06, "epoch": 2.44, "percentage": 81.33, "elapsed_time": "1 day, 12:52:45", "remaining_time": "8:27:50"}
|
62 |
+
{"current_steps": 620, "total_steps": 750, "loss": 0.2525, "lr": 8.876245235966884e-07, "epoch": 2.48, "percentage": 82.67, "elapsed_time": "1 day, 13:28:38", "remaining_time": "7:51:29"}
|
63 |
+
{"current_steps": 630, "total_steps": 750, "loss": 0.2623, "lr": 7.597595192178702e-07, "epoch": 2.52, "percentage": 84.0, "elapsed_time": "1 day, 14:05:25", "remaining_time": "7:15:19"}
|
64 |
+
{"current_steps": 640, "total_steps": 750, "loss": 0.2831, "lr": 6.410779315161885e-07, "epoch": 2.56, "percentage": 85.33, "elapsed_time": "1 day, 14:41:26", "remaining_time": "6:38:59"}
|
65 |
+
{"current_steps": 650, "total_steps": 750, "loss": 0.2634, "lr": 5.318367983829393e-07, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "1 day, 15:17:47", "remaining_time": "6:02:44"}
|
66 |
+
{"current_steps": 660, "total_steps": 750, "loss": 0.2383, "lr": 4.322727117869951e-07, "epoch": 2.64, "percentage": 88.0, "elapsed_time": "1 day, 15:54:07", "remaining_time": "5:26:28"}
|
67 |
+
{"current_steps": 670, "total_steps": 750, "loss": 0.2684, "lr": 3.426013053692878e-07, "epoch": 2.68, "percentage": 89.33, "elapsed_time": "1 day, 16:30:36", "remaining_time": "4:50:13"}
|
68 |
+
{"current_steps": 680, "total_steps": 750, "loss": 0.2586, "lr": 2.63016787428354e-07, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "1 day, 17:06:27", "remaining_time": "4:13:54"}
|
69 |
+
{"current_steps": 690, "total_steps": 750, "loss": 0.2424, "lr": 1.9369152030840553e-07, "epoch": 2.76, "percentage": 92.0, "elapsed_time": "1 day, 17:42:21", "remaining_time": "3:37:35"}
|
70 |
+
{"current_steps": 700, "total_steps": 750, "loss": 0.2795, "lr": 1.3477564710088097e-07, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "1 day, 18:18:20", "remaining_time": "3:01:18"}
|
71 |
+
{"current_steps": 710, "total_steps": 750, "loss": 0.2872, "lr": 8.639676646793382e-08, "epoch": 2.84, "percentage": 94.67, "elapsed_time": "1 day, 18:54:19", "remaining_time": "2:25:01"}
|
72 |
+
{"current_steps": 720, "total_steps": 750, "loss": 0.246, "lr": 4.865965629214819e-08, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "1 day, 19:29:54", "remaining_time": "1:48:44"}
|
73 |
+
{"current_steps": 730, "total_steps": 750, "loss": 0.2513, "lr": 2.1646046750978255e-08, "epoch": 2.92, "percentage": 97.33, "elapsed_time": "1 day, 20:06:48", "remaining_time": "1:12:30"}
|
74 |
+
{"current_steps": 740, "total_steps": 750, "loss": 0.24, "lr": 5.414443307377171e-09, "epoch": 2.96, "percentage": 98.67, "elapsed_time": "1 day, 20:42:11", "remaining_time": "0:36:14"}
|
75 |
+
{"current_steps": 750, "total_steps": 750, "loss": 0.2572, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1 day, 21:18:01", "remaining_time": "0:00:00"}
|
76 |
+
{"current_steps": 750, "total_steps": 750, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1 day, 21:19:39", "remaining_time": "0:00:00"}
|