Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:282863b7aca4687bff1a01122ab94c4d23e54a9274d81c191452cd2da4d6c93b
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a908783c91cbc9db27fd59d4444bb32b8cd58e1a6dd48eaa98d0fc0a0f5bb49e
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54e10f7302d44b0ad8c0fde13e349bccbe1b9b3cdbbae35183fcad3fe874e07f
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e6c2be9a17165decdd93382b6edbe0f4c0fa4df04593cbd0621e53b355429c2
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -21,3 +21,27 @@
|
|
21 |
{"current_steps": 210, "total_steps": 678, "loss": 0.8194, "lr": 5e-06, "epoch": 0.9286898839137645, "percentage": 30.97, "elapsed_time": "3:21:37", "remaining_time": "7:29:19"}
|
22 |
{"current_steps": 220, "total_steps": 678, "loss": 0.8192, "lr": 5e-06, "epoch": 0.9729132117191819, "percentage": 32.45, "elapsed_time": "3:31:12", "remaining_time": "7:19:42"}
|
23 |
{"current_steps": 226, "total_steps": 678, "eval_loss": 0.8188642859458923, "epoch": 0.9994472084024323, "percentage": 33.33, "elapsed_time": "3:41:06", "remaining_time": "7:22:12"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
{"current_steps": 210, "total_steps": 678, "loss": 0.8194, "lr": 5e-06, "epoch": 0.9286898839137645, "percentage": 30.97, "elapsed_time": "3:21:37", "remaining_time": "7:29:19"}
|
22 |
{"current_steps": 220, "total_steps": 678, "loss": 0.8192, "lr": 5e-06, "epoch": 0.9729132117191819, "percentage": 32.45, "elapsed_time": "3:31:12", "remaining_time": "7:19:42"}
|
23 |
{"current_steps": 226, "total_steps": 678, "eval_loss": 0.8188642859458923, "epoch": 0.9994472084024323, "percentage": 33.33, "elapsed_time": "3:41:06", "remaining_time": "7:22:12"}
|
24 |
+
{"current_steps": 230, "total_steps": 678, "loss": 0.8736, "lr": 5e-06, "epoch": 1.0171365395245993, "percentage": 33.92, "elapsed_time": "3:45:57", "remaining_time": "7:20:08"}
|
25 |
+
{"current_steps": 240, "total_steps": 678, "loss": 0.7791, "lr": 5e-06, "epoch": 1.0613598673300166, "percentage": 35.4, "elapsed_time": "3:55:33", "remaining_time": "7:09:54"}
|
26 |
+
{"current_steps": 250, "total_steps": 678, "loss": 0.7727, "lr": 5e-06, "epoch": 1.105583195135434, "percentage": 36.87, "elapsed_time": "4:05:09", "remaining_time": "6:59:42"}
|
27 |
+
{"current_steps": 260, "total_steps": 678, "loss": 0.7744, "lr": 5e-06, "epoch": 1.1498065229408514, "percentage": 38.35, "elapsed_time": "4:14:45", "remaining_time": "6:49:34"}
|
28 |
+
{"current_steps": 270, "total_steps": 678, "loss": 0.7782, "lr": 5e-06, "epoch": 1.1940298507462686, "percentage": 39.82, "elapsed_time": "4:24:21", "remaining_time": "6:39:29"}
|
29 |
+
{"current_steps": 280, "total_steps": 678, "loss": 0.7725, "lr": 5e-06, "epoch": 1.238253178551686, "percentage": 41.3, "elapsed_time": "4:33:57", "remaining_time": "6:29:25"}
|
30 |
+
{"current_steps": 290, "total_steps": 678, "loss": 0.7743, "lr": 5e-06, "epoch": 1.2824765063571033, "percentage": 42.77, "elapsed_time": "4:43:33", "remaining_time": "6:19:22"}
|
31 |
+
{"current_steps": 300, "total_steps": 678, "loss": 0.7771, "lr": 5e-06, "epoch": 1.3266998341625207, "percentage": 44.25, "elapsed_time": "4:53:08", "remaining_time": "6:09:22"}
|
32 |
+
{"current_steps": 310, "total_steps": 678, "loss": 0.7791, "lr": 5e-06, "epoch": 1.370923161967938, "percentage": 45.72, "elapsed_time": "5:02:44", "remaining_time": "5:59:23"}
|
33 |
+
{"current_steps": 320, "total_steps": 678, "loss": 0.7701, "lr": 5e-06, "epoch": 1.4151464897733554, "percentage": 47.2, "elapsed_time": "5:12:20", "remaining_time": "5:49:26"}
|
34 |
+
{"current_steps": 330, "total_steps": 678, "loss": 0.7744, "lr": 5e-06, "epoch": 1.4593698175787728, "percentage": 48.67, "elapsed_time": "5:21:56", "remaining_time": "5:39:30"}
|
35 |
+
{"current_steps": 340, "total_steps": 678, "loss": 0.7742, "lr": 5e-06, "epoch": 1.5035931453841902, "percentage": 50.15, "elapsed_time": "5:31:32", "remaining_time": "5:29:35"}
|
36 |
+
{"current_steps": 350, "total_steps": 678, "loss": 0.7766, "lr": 5e-06, "epoch": 1.5478164731896076, "percentage": 51.62, "elapsed_time": "5:41:07", "remaining_time": "5:19:41"}
|
37 |
+
{"current_steps": 360, "total_steps": 678, "loss": 0.7655, "lr": 5e-06, "epoch": 1.5920398009950247, "percentage": 53.1, "elapsed_time": "5:50:43", "remaining_time": "5:09:48"}
|
38 |
+
{"current_steps": 370, "total_steps": 678, "loss": 0.7664, "lr": 5e-06, "epoch": 1.6362631288004423, "percentage": 54.57, "elapsed_time": "6:00:19", "remaining_time": "4:59:56"}
|
39 |
+
{"current_steps": 380, "total_steps": 678, "loss": 0.7734, "lr": 5e-06, "epoch": 1.6804864566058595, "percentage": 56.05, "elapsed_time": "6:09:55", "remaining_time": "4:50:05"}
|
40 |
+
{"current_steps": 390, "total_steps": 678, "loss": 0.7697, "lr": 5e-06, "epoch": 1.724709784411277, "percentage": 57.52, "elapsed_time": "6:19:31", "remaining_time": "4:40:15"}
|
41 |
+
{"current_steps": 400, "total_steps": 678, "loss": 0.7698, "lr": 5e-06, "epoch": 1.7689331122166942, "percentage": 59.0, "elapsed_time": "6:29:08", "remaining_time": "4:30:26"}
|
42 |
+
{"current_steps": 410, "total_steps": 678, "loss": 0.7701, "lr": 5e-06, "epoch": 1.8131564400221116, "percentage": 60.47, "elapsed_time": "6:38:44", "remaining_time": "4:20:38"}
|
43 |
+
{"current_steps": 420, "total_steps": 678, "loss": 0.7673, "lr": 5e-06, "epoch": 1.857379767827529, "percentage": 61.95, "elapsed_time": "6:48:20", "remaining_time": "4:10:50"}
|
44 |
+
{"current_steps": 430, "total_steps": 678, "loss": 0.7782, "lr": 5e-06, "epoch": 1.9016030956329464, "percentage": 63.42, "elapsed_time": "6:57:56", "remaining_time": "4:01:02"}
|
45 |
+
{"current_steps": 440, "total_steps": 678, "loss": 0.7657, "lr": 5e-06, "epoch": 1.9458264234383638, "percentage": 64.9, "elapsed_time": "7:07:32", "remaining_time": "3:51:15"}
|
46 |
+
{"current_steps": 450, "total_steps": 678, "loss": 0.773, "lr": 5e-06, "epoch": 1.9900497512437811, "percentage": 66.37, "elapsed_time": "7:17:08", "remaining_time": "3:41:29"}
|
47 |
+
{"current_steps": 452, "total_steps": 678, "eval_loss": 0.8043199181556702, "epoch": 1.9988944168048646, "percentage": 66.67, "elapsed_time": "7:23:17", "remaining_time": "3:41:38"}
|