Training in progress, step 5500
Browse files
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 42002584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93b669005c07fa16bbd13ca192d6c99a2118e0e9eca5eea001d58c992b020b7f
|
3 |
size 42002584
|
runs/Jan28_08-58-19_COE-CS-sv003/events.out.tfevents.1738054724.COE-CS-sv003.4044272.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:125917f64bcd852c13d6c0a33727ec44e008146642b53d9deff979f7033be424
|
3 |
+
size 121488
|
trainer_log.jsonl
CHANGED
@@ -498,3 +498,53 @@
|
|
498 |
{"current_steps": 4980, "total_steps": 5625, "loss": 0.0526, "lr": 3.2093162080754637e-06, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "12:37:46", "remaining_time": "1:38:08"}
|
499 |
{"current_steps": 4990, "total_steps": 5625, "loss": 0.0602, "lr": 3.1116112956677046e-06, "epoch": 2.6613333333333333, "percentage": 88.71, "elapsed_time": "12:39:17", "remaining_time": "1:36:37"}
|
500 |
{"current_steps": 5000, "total_steps": 5625, "loss": 0.0601, "lr": 3.0153689607045845e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "12:40:48", "remaining_time": "1:35:06"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
498 |
{"current_steps": 4980, "total_steps": 5625, "loss": 0.0526, "lr": 3.2093162080754637e-06, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "12:37:46", "remaining_time": "1:38:08"}
|
499 |
{"current_steps": 4990, "total_steps": 5625, "loss": 0.0602, "lr": 3.1116112956677046e-06, "epoch": 2.6613333333333333, "percentage": 88.71, "elapsed_time": "12:39:17", "remaining_time": "1:36:37"}
|
500 |
{"current_steps": 5000, "total_steps": 5625, "loss": 0.0601, "lr": 3.0153689607045845e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "12:40:48", "remaining_time": "1:35:06"}
|
501 |
+
{"current_steps": 5010, "total_steps": 5625, "loss": 0.0743, "lr": 2.9205922052484958e-06, "epoch": 2.672, "percentage": 89.07, "elapsed_time": "12:42:27", "remaining_time": "1:33:35"}
|
502 |
+
{"current_steps": 5020, "total_steps": 5625, "loss": 0.0562, "lr": 2.8272839856463783e-06, "epoch": 2.6773333333333333, "percentage": 89.24, "elapsed_time": "12:43:58", "remaining_time": "1:32:04"}
|
503 |
+
{"current_steps": 5030, "total_steps": 5625, "loss": 0.0384, "lr": 2.735447212437531e-06, "epoch": 2.6826666666666665, "percentage": 89.42, "elapsed_time": "12:45:29", "remaining_time": "1:30:32"}
|
504 |
+
{"current_steps": 5040, "total_steps": 5625, "loss": 0.0485, "lr": 2.6450847502627884e-06, "epoch": 2.6879999999999997, "percentage": 89.6, "elapsed_time": "12:46:59", "remaining_time": "1:29:01"}
|
505 |
+
{"current_steps": 5050, "total_steps": 5625, "loss": 0.0525, "lr": 2.5561994177751737e-06, "epoch": 2.6933333333333334, "percentage": 89.78, "elapsed_time": "12:48:30", "remaining_time": "1:27:30"}
|
506 |
+
{"current_steps": 5060, "total_steps": 5625, "loss": 0.0571, "lr": 2.468793987551998e-06, "epoch": 2.6986666666666665, "percentage": 89.96, "elapsed_time": "12:50:01", "remaining_time": "1:25:58"}
|
507 |
+
{"current_steps": 5070, "total_steps": 5625, "loss": 0.0528, "lr": 2.3828711860083674e-06, "epoch": 2.7039999999999997, "percentage": 90.13, "elapsed_time": "12:51:31", "remaining_time": "1:24:27"}
|
508 |
+
{"current_steps": 5080, "total_steps": 5625, "loss": 0.0431, "lr": 2.2984336933121075e-06, "epoch": 2.7093333333333334, "percentage": 90.31, "elapsed_time": "12:53:02", "remaining_time": "1:22:56"}
|
509 |
+
{"current_steps": 5090, "total_steps": 5625, "loss": 0.0523, "lr": 2.2154841433002062e-06, "epoch": 2.7146666666666666, "percentage": 90.49, "elapsed_time": "12:54:34", "remaining_time": "1:21:24"}
|
510 |
+
{"current_steps": 5100, "total_steps": 5625, "loss": 0.054, "lr": 2.134025123396638e-06, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "12:56:05", "remaining_time": "1:19:53"}
|
511 |
+
{"current_steps": 5110, "total_steps": 5625, "loss": 0.0686, "lr": 2.054059174531653e-06, "epoch": 2.7253333333333334, "percentage": 90.84, "elapsed_time": "12:57:36", "remaining_time": "1:18:22"}
|
512 |
+
{"current_steps": 5120, "total_steps": 5625, "loss": 0.0542, "lr": 1.9755887910625105e-06, "epoch": 2.7306666666666666, "percentage": 91.02, "elapsed_time": "12:59:08", "remaining_time": "1:16:50"}
|
513 |
+
{"current_steps": 5130, "total_steps": 5625, "loss": 0.0591, "lr": 1.8986164206957035e-06, "epoch": 2.7359999999999998, "percentage": 91.2, "elapsed_time": "13:00:39", "remaining_time": "1:15:19"}
|
514 |
+
{"current_steps": 5140, "total_steps": 5625, "loss": 0.076, "lr": 1.8231444644105756e-06, "epoch": 2.7413333333333334, "percentage": 91.38, "elapsed_time": "13:02:10", "remaining_time": "1:13:48"}
|
515 |
+
{"current_steps": 5150, "total_steps": 5625, "loss": 0.0576, "lr": 1.7491752763844293e-06, "epoch": 2.7466666666666666, "percentage": 91.56, "elapsed_time": "13:03:42", "remaining_time": "1:12:17"}
|
516 |
+
{"current_steps": 5160, "total_steps": 5625, "loss": 0.0687, "lr": 1.6767111639191202e-06, "epoch": 2.752, "percentage": 91.73, "elapsed_time": "13:05:13", "remaining_time": "1:10:45"}
|
517 |
+
{"current_steps": 5170, "total_steps": 5625, "loss": 0.0573, "lr": 1.6057543873690683e-06, "epoch": 2.7573333333333334, "percentage": 91.91, "elapsed_time": "13:06:44", "remaining_time": "1:09:14"}
|
518 |
+
{"current_steps": 5180, "total_steps": 5625, "loss": 0.0578, "lr": 1.5363071600707435e-06, "epoch": 2.7626666666666666, "percentage": 92.09, "elapsed_time": "13:08:16", "remaining_time": "1:07:43"}
|
519 |
+
{"current_steps": 5190, "total_steps": 5625, "loss": 0.0698, "lr": 1.4683716482736366e-06, "epoch": 2.768, "percentage": 92.27, "elapsed_time": "13:09:47", "remaining_time": "1:06:11"}
|
520 |
+
{"current_steps": 5200, "total_steps": 5625, "loss": 0.0594, "lr": 1.4019499710726913e-06, "epoch": 2.7733333333333334, "percentage": 92.44, "elapsed_time": "13:11:19", "remaining_time": "1:04:40"}
|
521 |
+
{"current_steps": 5210, "total_steps": 5625, "loss": 0.0645, "lr": 1.3370442003421913e-06, "epoch": 2.7786666666666666, "percentage": 92.62, "elapsed_time": "13:12:50", "remaining_time": "1:03:09"}
|
522 |
+
{"current_steps": 5220, "total_steps": 5625, "loss": 0.1017, "lr": 1.2736563606711382e-06, "epoch": 2.784, "percentage": 92.8, "elapsed_time": "13:14:22", "remaining_time": "1:01:37"}
|
523 |
+
{"current_steps": 5230, "total_steps": 5625, "loss": 0.0622, "lr": 1.2117884293001258e-06, "epoch": 2.7893333333333334, "percentage": 92.98, "elapsed_time": "13:15:53", "remaining_time": "1:00:06"}
|
524 |
+
{"current_steps": 5240, "total_steps": 5625, "loss": 0.0401, "lr": 1.1514423360595938e-06, "epoch": 2.7946666666666666, "percentage": 93.16, "elapsed_time": "13:17:24", "remaining_time": "0:58:35"}
|
525 |
+
{"current_steps": 5250, "total_steps": 5625, "loss": 0.0639, "lr": 1.0926199633097157e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "13:18:55", "remaining_time": "0:57:03"}
|
526 |
+
{"current_steps": 5260, "total_steps": 5625, "loss": 0.0525, "lr": 1.0353231458816337e-06, "epoch": 2.8053333333333335, "percentage": 93.51, "elapsed_time": "13:20:27", "remaining_time": "0:55:32"}
|
527 |
+
{"current_steps": 5270, "total_steps": 5625, "loss": 0.0647, "lr": 9.795536710202169e-07, "epoch": 2.8106666666666666, "percentage": 93.69, "elapsed_time": "13:21:58", "remaining_time": "0:54:01"}
|
528 |
+
{"current_steps": 5280, "total_steps": 5625, "loss": 0.0967, "lr": 9.253132783283547e-07, "epoch": 2.816, "percentage": 93.87, "elapsed_time": "13:23:30", "remaining_time": "0:52:30"}
|
529 |
+
{"current_steps": 5290, "total_steps": 5625, "loss": 0.049, "lr": 8.726036597126619e-07, "epoch": 2.8213333333333335, "percentage": 94.04, "elapsed_time": "13:25:01", "remaining_time": "0:50:58"}
|
530 |
+
{"current_steps": 5300, "total_steps": 5625, "loss": 0.0496, "lr": 8.214264593307098e-07, "epoch": 2.8266666666666667, "percentage": 94.22, "elapsed_time": "13:26:32", "remaining_time": "0:49:27"}
|
531 |
+
{"current_steps": 5310, "total_steps": 5625, "loss": 0.0596, "lr": 7.717832735397335e-07, "epoch": 2.832, "percentage": 94.4, "elapsed_time": "13:28:03", "remaining_time": "0:47:56"}
|
532 |
+
{"current_steps": 5320, "total_steps": 5625, "loss": 0.0735, "lr": 7.236756508468611e-07, "epoch": 2.8373333333333335, "percentage": 94.58, "elapsed_time": "13:29:35", "remaining_time": "0:46:24"}
|
533 |
+
{"current_steps": 5330, "total_steps": 5625, "loss": 0.0389, "lr": 6.771050918607913e-07, "epoch": 2.8426666666666667, "percentage": 94.76, "elapsed_time": "13:31:06", "remaining_time": "0:44:53"}
|
534 |
+
{"current_steps": 5340, "total_steps": 5625, "loss": 0.0546, "lr": 6.3207304924498e-07, "epoch": 2.848, "percentage": 94.93, "elapsed_time": "13:32:37", "remaining_time": "0:43:22"}
|
535 |
+
{"current_steps": 5350, "total_steps": 5625, "loss": 0.0581, "lr": 5.885809276723608e-07, "epoch": 2.8533333333333335, "percentage": 95.11, "elapsed_time": "13:34:09", "remaining_time": "0:41:50"}
|
536 |
+
{"current_steps": 5360, "total_steps": 5625, "loss": 0.0645, "lr": 5.466300837814797e-07, "epoch": 2.8586666666666667, "percentage": 95.29, "elapsed_time": "13:35:40", "remaining_time": "0:40:19"}
|
537 |
+
{"current_steps": 5370, "total_steps": 5625, "loss": 0.0559, "lr": 5.062218261342122e-07, "epoch": 2.864, "percentage": 95.47, "elapsed_time": "13:37:12", "remaining_time": "0:38:48"}
|
538 |
+
{"current_steps": 5380, "total_steps": 5625, "loss": 0.0425, "lr": 4.673574151749571e-07, "epoch": 2.8693333333333335, "percentage": 95.64, "elapsed_time": "13:38:43", "remaining_time": "0:37:17"}
|
539 |
+
{"current_steps": 5390, "total_steps": 5625, "loss": 0.0542, "lr": 4.300380631912737e-07, "epoch": 2.8746666666666667, "percentage": 95.82, "elapsed_time": "13:40:14", "remaining_time": "0:35:45"}
|
540 |
+
{"current_steps": 5400, "total_steps": 5625, "loss": 0.0616, "lr": 3.9426493427611177e-07, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "13:41:45", "remaining_time": "0:34:14"}
|
541 |
+
{"current_steps": 5410, "total_steps": 5625, "loss": 0.0676, "lr": 3.600391442914741e-07, "epoch": 2.8853333333333335, "percentage": 96.18, "elapsed_time": "13:43:17", "remaining_time": "0:32:43"}
|
542 |
+
{"current_steps": 5420, "total_steps": 5625, "loss": 0.0864, "lr": 3.2736176083362216e-07, "epoch": 2.8906666666666667, "percentage": 96.36, "elapsed_time": "13:44:48", "remaining_time": "0:31:11"}
|
543 |
+
{"current_steps": 5430, "total_steps": 5625, "loss": 0.0438, "lr": 2.962338031997691e-07, "epoch": 2.896, "percentage": 96.53, "elapsed_time": "13:46:19", "remaining_time": "0:29:40"}
|
544 |
+
{"current_steps": 5440, "total_steps": 5625, "loss": 0.0572, "lr": 2.666562423562946e-07, "epoch": 2.9013333333333335, "percentage": 96.71, "elapsed_time": "13:47:50", "remaining_time": "0:28:09"}
|
545 |
+
{"current_steps": 5450, "total_steps": 5625, "loss": 0.0508, "lr": 2.386300009084408e-07, "epoch": 2.9066666666666667, "percentage": 96.89, "elapsed_time": "13:49:21", "remaining_time": "0:26:37"}
|
546 |
+
{"current_steps": 5460, "total_steps": 5625, "loss": 0.0557, "lr": 2.1215595307154667e-07, "epoch": 2.912, "percentage": 97.07, "elapsed_time": "13:50:53", "remaining_time": "0:25:06"}
|
547 |
+
{"current_steps": 5470, "total_steps": 5625, "loss": 0.0435, "lr": 1.872349246437699e-07, "epoch": 2.9173333333333336, "percentage": 97.24, "elapsed_time": "13:52:24", "remaining_time": "0:23:35"}
|
548 |
+
{"current_steps": 5480, "total_steps": 5625, "loss": 0.0529, "lr": 1.6386769298034065e-07, "epoch": 2.9226666666666667, "percentage": 97.42, "elapsed_time": "13:53:55", "remaining_time": "0:22:03"}
|
549 |
+
{"current_steps": 5490, "total_steps": 5625, "loss": 0.0563, "lr": 1.420549869693033e-07, "epoch": 2.928, "percentage": 97.6, "elapsed_time": "13:55:26", "remaining_time": "0:20:32"}
|
550 |
+
{"current_steps": 5500, "total_steps": 5625, "loss": 0.057, "lr": 1.2179748700879012e-07, "epoch": 2.9333333333333336, "percentage": 97.78, "elapsed_time": "13:56:57", "remaining_time": "0:19:01"}
|