Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b161373ef5a44bcc6e0cdd088b6105e941089fa4f1ab7e86d4fe4365ce5b51e1
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37b593f087584e6189b26da462075bc37a91be7d431044129cd2a83e6e3fb2bf
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b385f7dc6279ccfe020d1c9f1e537295607bbdfd15a9b2ea7c0dafe9e4b430b
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a4167ab79b9ef9e92d684350619f1c8952b1c5b27128456c7574b3eaf2691da
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -22,3 +22,13 @@
|
|
22 |
{"current_steps": 22, "total_steps": 150, "loss": 0.4665, "lr": 3.973523064225159e-05, "epoch": 2.2, "percentage": 14.67, "elapsed_time": "0:14:41", "remaining_time": "1:25:28"}
|
23 |
{"current_steps": 23, "total_steps": 150, "loss": 0.4194, "lr": 3.965441293412827e-05, "epoch": 2.3, "percentage": 15.33, "elapsed_time": "0:15:15", "remaining_time": "1:24:16"}
|
24 |
{"current_steps": 24, "total_steps": 150, "loss": 0.4105, "lr": 3.9562952014676116e-05, "epoch": 2.4, "percentage": 16.0, "elapsed_time": "0:15:51", "remaining_time": "1:23:13"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
22 |
{"current_steps": 22, "total_steps": 150, "loss": 0.4665, "lr": 3.973523064225159e-05, "epoch": 2.2, "percentage": 14.67, "elapsed_time": "0:14:41", "remaining_time": "1:25:28"}
|
23 |
{"current_steps": 23, "total_steps": 150, "loss": 0.4194, "lr": 3.965441293412827e-05, "epoch": 2.3, "percentage": 15.33, "elapsed_time": "0:15:15", "remaining_time": "1:24:16"}
|
24 |
{"current_steps": 24, "total_steps": 150, "loss": 0.4105, "lr": 3.9562952014676116e-05, "epoch": 2.4, "percentage": 16.0, "elapsed_time": "0:15:51", "remaining_time": "1:23:13"}
|
25 |
+
{"current_steps": 25, "total_steps": 150, "loss": 0.433, "lr": 3.946089741159648e-05, "epoch": 2.5, "percentage": 16.67, "elapsed_time": "0:16:33", "remaining_time": "1:22:49"}
|
26 |
+
{"current_steps": 26, "total_steps": 150, "loss": 0.4056, "lr": 3.934830438925728e-05, "epoch": 2.6, "percentage": 17.33, "elapsed_time": "0:17:12", "remaining_time": "1:22:05"}
|
27 |
+
{"current_steps": 27, "total_steps": 150, "loss": 0.4483, "lr": 3.922523391876638e-05, "epoch": 2.7, "percentage": 18.0, "elapsed_time": "0:17:44", "remaining_time": "1:20:50"}
|
28 |
+
{"current_steps": 28, "total_steps": 150, "loss": 0.4313, "lr": 3.909175264495464e-05, "epoch": 2.8, "percentage": 18.67, "elapsed_time": "0:18:13", "remaining_time": "1:19:23"}
|
29 |
+
{"current_steps": 29, "total_steps": 150, "loss": 0.3754, "lr": 3.8947932850286585e-05, "epoch": 2.9, "percentage": 19.33, "elapsed_time": "0:18:47", "remaining_time": "1:18:23"}
|
30 |
+
{"current_steps": 30, "total_steps": 150, "loss": 0.4333, "lr": 3.879385241571817e-05, "epoch": 3.0, "percentage": 20.0, "elapsed_time": "0:19:22", "remaining_time": "1:17:30"}
|
31 |
+
{"current_steps": 31, "total_steps": 150, "loss": 0.295, "lr": 3.862959477852285e-05, "epoch": 3.1, "percentage": 20.67, "elapsed_time": "0:21:05", "remaining_time": "1:20:57"}
|
32 |
+
{"current_steps": 32, "total_steps": 150, "loss": 0.2472, "lr": 3.845524888710885e-05, "epoch": 3.2, "percentage": 21.33, "elapsed_time": "0:21:36", "remaining_time": "1:19:40"}
|
33 |
+
{"current_steps": 33, "total_steps": 150, "loss": 0.2934, "lr": 3.827090915285202e-05, "epoch": 3.3, "percentage": 22.0, "elapsed_time": "0:22:11", "remaining_time": "1:18:40"}
|
34 |
+
{"current_steps": 34, "total_steps": 150, "loss": 0.3205, "lr": 3.807667539897041e-05, "epoch": 3.4, "percentage": 22.67, "elapsed_time": "0:22:53", "remaining_time": "1:18:04"}
|