Rakancorle1 commited on
Commit
eafa850
·
verified ·
1 Parent(s): 4d66eb1

Training in progress, step 5500

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7615a57c2afa77ba1ab2c9613b08df0b66d411adac39151d1f07baa3bdf12ea
3
  size 42002584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93b669005c07fa16bbd13ca192d6c99a2118e0e9eca5eea001d58c992b020b7f
3
  size 42002584
runs/Jan28_08-58-19_COE-CS-sv003/events.out.tfevents.1738054724.COE-CS-sv003.4044272.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c85783e8c4242588b6e64fd42241865c67fce93e7145667fa27c4b4b4cc659d
3
- size 110938
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:125917f64bcd852c13d6c0a33727ec44e008146642b53d9deff979f7033be424
3
+ size 121488
trainer_log.jsonl CHANGED
@@ -498,3 +498,53 @@
498
  {"current_steps": 4980, "total_steps": 5625, "loss": 0.0526, "lr": 3.2093162080754637e-06, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "12:37:46", "remaining_time": "1:38:08"}
499
  {"current_steps": 4990, "total_steps": 5625, "loss": 0.0602, "lr": 3.1116112956677046e-06, "epoch": 2.6613333333333333, "percentage": 88.71, "elapsed_time": "12:39:17", "remaining_time": "1:36:37"}
500
  {"current_steps": 5000, "total_steps": 5625, "loss": 0.0601, "lr": 3.0153689607045845e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "12:40:48", "remaining_time": "1:35:06"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
498
  {"current_steps": 4980, "total_steps": 5625, "loss": 0.0526, "lr": 3.2093162080754637e-06, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "12:37:46", "remaining_time": "1:38:08"}
499
  {"current_steps": 4990, "total_steps": 5625, "loss": 0.0602, "lr": 3.1116112956677046e-06, "epoch": 2.6613333333333333, "percentage": 88.71, "elapsed_time": "12:39:17", "remaining_time": "1:36:37"}
500
  {"current_steps": 5000, "total_steps": 5625, "loss": 0.0601, "lr": 3.0153689607045845e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "12:40:48", "remaining_time": "1:35:06"}
501
+ {"current_steps": 5010, "total_steps": 5625, "loss": 0.0743, "lr": 2.9205922052484958e-06, "epoch": 2.672, "percentage": 89.07, "elapsed_time": "12:42:27", "remaining_time": "1:33:35"}
502
+ {"current_steps": 5020, "total_steps": 5625, "loss": 0.0562, "lr": 2.8272839856463783e-06, "epoch": 2.6773333333333333, "percentage": 89.24, "elapsed_time": "12:43:58", "remaining_time": "1:32:04"}
503
+ {"current_steps": 5030, "total_steps": 5625, "loss": 0.0384, "lr": 2.735447212437531e-06, "epoch": 2.6826666666666665, "percentage": 89.42, "elapsed_time": "12:45:29", "remaining_time": "1:30:32"}
504
+ {"current_steps": 5040, "total_steps": 5625, "loss": 0.0485, "lr": 2.6450847502627884e-06, "epoch": 2.6879999999999997, "percentage": 89.6, "elapsed_time": "12:46:59", "remaining_time": "1:29:01"}
505
+ {"current_steps": 5050, "total_steps": 5625, "loss": 0.0525, "lr": 2.5561994177751737e-06, "epoch": 2.6933333333333334, "percentage": 89.78, "elapsed_time": "12:48:30", "remaining_time": "1:27:30"}
506
+ {"current_steps": 5060, "total_steps": 5625, "loss": 0.0571, "lr": 2.468793987551998e-06, "epoch": 2.6986666666666665, "percentage": 89.96, "elapsed_time": "12:50:01", "remaining_time": "1:25:58"}
507
+ {"current_steps": 5070, "total_steps": 5625, "loss": 0.0528, "lr": 2.3828711860083674e-06, "epoch": 2.7039999999999997, "percentage": 90.13, "elapsed_time": "12:51:31", "remaining_time": "1:24:27"}
508
+ {"current_steps": 5080, "total_steps": 5625, "loss": 0.0431, "lr": 2.2984336933121075e-06, "epoch": 2.7093333333333334, "percentage": 90.31, "elapsed_time": "12:53:02", "remaining_time": "1:22:56"}
509
+ {"current_steps": 5090, "total_steps": 5625, "loss": 0.0523, "lr": 2.2154841433002062e-06, "epoch": 2.7146666666666666, "percentage": 90.49, "elapsed_time": "12:54:34", "remaining_time": "1:21:24"}
510
+ {"current_steps": 5100, "total_steps": 5625, "loss": 0.054, "lr": 2.134025123396638e-06, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "12:56:05", "remaining_time": "1:19:53"}
511
+ {"current_steps": 5110, "total_steps": 5625, "loss": 0.0686, "lr": 2.054059174531653e-06, "epoch": 2.7253333333333334, "percentage": 90.84, "elapsed_time": "12:57:36", "remaining_time": "1:18:22"}
512
+ {"current_steps": 5120, "total_steps": 5625, "loss": 0.0542, "lr": 1.9755887910625105e-06, "epoch": 2.7306666666666666, "percentage": 91.02, "elapsed_time": "12:59:08", "remaining_time": "1:16:50"}
513
+ {"current_steps": 5130, "total_steps": 5625, "loss": 0.0591, "lr": 1.8986164206957035e-06, "epoch": 2.7359999999999998, "percentage": 91.2, "elapsed_time": "13:00:39", "remaining_time": "1:15:19"}
514
+ {"current_steps": 5140, "total_steps": 5625, "loss": 0.076, "lr": 1.8231444644105756e-06, "epoch": 2.7413333333333334, "percentage": 91.38, "elapsed_time": "13:02:10", "remaining_time": "1:13:48"}
515
+ {"current_steps": 5150, "total_steps": 5625, "loss": 0.0576, "lr": 1.7491752763844293e-06, "epoch": 2.7466666666666666, "percentage": 91.56, "elapsed_time": "13:03:42", "remaining_time": "1:12:17"}
516
+ {"current_steps": 5160, "total_steps": 5625, "loss": 0.0687, "lr": 1.6767111639191202e-06, "epoch": 2.752, "percentage": 91.73, "elapsed_time": "13:05:13", "remaining_time": "1:10:45"}
517
+ {"current_steps": 5170, "total_steps": 5625, "loss": 0.0573, "lr": 1.6057543873690683e-06, "epoch": 2.7573333333333334, "percentage": 91.91, "elapsed_time": "13:06:44", "remaining_time": "1:09:14"}
518
+ {"current_steps": 5180, "total_steps": 5625, "loss": 0.0578, "lr": 1.5363071600707435e-06, "epoch": 2.7626666666666666, "percentage": 92.09, "elapsed_time": "13:08:16", "remaining_time": "1:07:43"}
519
+ {"current_steps": 5190, "total_steps": 5625, "loss": 0.0698, "lr": 1.4683716482736366e-06, "epoch": 2.768, "percentage": 92.27, "elapsed_time": "13:09:47", "remaining_time": "1:06:11"}
520
+ {"current_steps": 5200, "total_steps": 5625, "loss": 0.0594, "lr": 1.4019499710726913e-06, "epoch": 2.7733333333333334, "percentage": 92.44, "elapsed_time": "13:11:19", "remaining_time": "1:04:40"}
521
+ {"current_steps": 5210, "total_steps": 5625, "loss": 0.0645, "lr": 1.3370442003421913e-06, "epoch": 2.7786666666666666, "percentage": 92.62, "elapsed_time": "13:12:50", "remaining_time": "1:03:09"}
522
+ {"current_steps": 5220, "total_steps": 5625, "loss": 0.1017, "lr": 1.2736563606711382e-06, "epoch": 2.784, "percentage": 92.8, "elapsed_time": "13:14:22", "remaining_time": "1:01:37"}
523
+ {"current_steps": 5230, "total_steps": 5625, "loss": 0.0622, "lr": 1.2117884293001258e-06, "epoch": 2.7893333333333334, "percentage": 92.98, "elapsed_time": "13:15:53", "remaining_time": "1:00:06"}
524
+ {"current_steps": 5240, "total_steps": 5625, "loss": 0.0401, "lr": 1.1514423360595938e-06, "epoch": 2.7946666666666666, "percentage": 93.16, "elapsed_time": "13:17:24", "remaining_time": "0:58:35"}
525
+ {"current_steps": 5250, "total_steps": 5625, "loss": 0.0639, "lr": 1.0926199633097157e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "13:18:55", "remaining_time": "0:57:03"}
526
+ {"current_steps": 5260, "total_steps": 5625, "loss": 0.0525, "lr": 1.0353231458816337e-06, "epoch": 2.8053333333333335, "percentage": 93.51, "elapsed_time": "13:20:27", "remaining_time": "0:55:32"}
527
+ {"current_steps": 5270, "total_steps": 5625, "loss": 0.0647, "lr": 9.795536710202169e-07, "epoch": 2.8106666666666666, "percentage": 93.69, "elapsed_time": "13:21:58", "remaining_time": "0:54:01"}
528
+ {"current_steps": 5280, "total_steps": 5625, "loss": 0.0967, "lr": 9.253132783283547e-07, "epoch": 2.816, "percentage": 93.87, "elapsed_time": "13:23:30", "remaining_time": "0:52:30"}
529
+ {"current_steps": 5290, "total_steps": 5625, "loss": 0.049, "lr": 8.726036597126619e-07, "epoch": 2.8213333333333335, "percentage": 94.04, "elapsed_time": "13:25:01", "remaining_time": "0:50:58"}
530
+ {"current_steps": 5300, "total_steps": 5625, "loss": 0.0496, "lr": 8.214264593307098e-07, "epoch": 2.8266666666666667, "percentage": 94.22, "elapsed_time": "13:26:32", "remaining_time": "0:49:27"}
531
+ {"current_steps": 5310, "total_steps": 5625, "loss": 0.0596, "lr": 7.717832735397335e-07, "epoch": 2.832, "percentage": 94.4, "elapsed_time": "13:28:03", "remaining_time": "0:47:56"}
532
+ {"current_steps": 5320, "total_steps": 5625, "loss": 0.0735, "lr": 7.236756508468611e-07, "epoch": 2.8373333333333335, "percentage": 94.58, "elapsed_time": "13:29:35", "remaining_time": "0:46:24"}
533
+ {"current_steps": 5330, "total_steps": 5625, "loss": 0.0389, "lr": 6.771050918607913e-07, "epoch": 2.8426666666666667, "percentage": 94.76, "elapsed_time": "13:31:06", "remaining_time": "0:44:53"}
534
+ {"current_steps": 5340, "total_steps": 5625, "loss": 0.0546, "lr": 6.3207304924498e-07, "epoch": 2.848, "percentage": 94.93, "elapsed_time": "13:32:37", "remaining_time": "0:43:22"}
535
+ {"current_steps": 5350, "total_steps": 5625, "loss": 0.0581, "lr": 5.885809276723608e-07, "epoch": 2.8533333333333335, "percentage": 95.11, "elapsed_time": "13:34:09", "remaining_time": "0:41:50"}
536
+ {"current_steps": 5360, "total_steps": 5625, "loss": 0.0645, "lr": 5.466300837814797e-07, "epoch": 2.8586666666666667, "percentage": 95.29, "elapsed_time": "13:35:40", "remaining_time": "0:40:19"}
537
+ {"current_steps": 5370, "total_steps": 5625, "loss": 0.0559, "lr": 5.062218261342122e-07, "epoch": 2.864, "percentage": 95.47, "elapsed_time": "13:37:12", "remaining_time": "0:38:48"}
538
+ {"current_steps": 5380, "total_steps": 5625, "loss": 0.0425, "lr": 4.673574151749571e-07, "epoch": 2.8693333333333335, "percentage": 95.64, "elapsed_time": "13:38:43", "remaining_time": "0:37:17"}
539
+ {"current_steps": 5390, "total_steps": 5625, "loss": 0.0542, "lr": 4.300380631912737e-07, "epoch": 2.8746666666666667, "percentage": 95.82, "elapsed_time": "13:40:14", "remaining_time": "0:35:45"}
540
+ {"current_steps": 5400, "total_steps": 5625, "loss": 0.0616, "lr": 3.9426493427611177e-07, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "13:41:45", "remaining_time": "0:34:14"}
541
+ {"current_steps": 5410, "total_steps": 5625, "loss": 0.0676, "lr": 3.600391442914741e-07, "epoch": 2.8853333333333335, "percentage": 96.18, "elapsed_time": "13:43:17", "remaining_time": "0:32:43"}
542
+ {"current_steps": 5420, "total_steps": 5625, "loss": 0.0864, "lr": 3.2736176083362216e-07, "epoch": 2.8906666666666667, "percentage": 96.36, "elapsed_time": "13:44:48", "remaining_time": "0:31:11"}
543
+ {"current_steps": 5430, "total_steps": 5625, "loss": 0.0438, "lr": 2.962338031997691e-07, "epoch": 2.896, "percentage": 96.53, "elapsed_time": "13:46:19", "remaining_time": "0:29:40"}
544
+ {"current_steps": 5440, "total_steps": 5625, "loss": 0.0572, "lr": 2.666562423562946e-07, "epoch": 2.9013333333333335, "percentage": 96.71, "elapsed_time": "13:47:50", "remaining_time": "0:28:09"}
545
+ {"current_steps": 5450, "total_steps": 5625, "loss": 0.0508, "lr": 2.386300009084408e-07, "epoch": 2.9066666666666667, "percentage": 96.89, "elapsed_time": "13:49:21", "remaining_time": "0:26:37"}
546
+ {"current_steps": 5460, "total_steps": 5625, "loss": 0.0557, "lr": 2.1215595307154667e-07, "epoch": 2.912, "percentage": 97.07, "elapsed_time": "13:50:53", "remaining_time": "0:25:06"}
547
+ {"current_steps": 5470, "total_steps": 5625, "loss": 0.0435, "lr": 1.872349246437699e-07, "epoch": 2.9173333333333336, "percentage": 97.24, "elapsed_time": "13:52:24", "remaining_time": "0:23:35"}
548
+ {"current_steps": 5480, "total_steps": 5625, "loss": 0.0529, "lr": 1.6386769298034065e-07, "epoch": 2.9226666666666667, "percentage": 97.42, "elapsed_time": "13:53:55", "remaining_time": "0:22:03"}
549
+ {"current_steps": 5490, "total_steps": 5625, "loss": 0.0563, "lr": 1.420549869693033e-07, "epoch": 2.928, "percentage": 97.6, "elapsed_time": "13:55:26", "remaining_time": "0:20:32"}
550
+ {"current_steps": 5500, "total_steps": 5625, "loss": 0.057, "lr": 1.2179748700879012e-07, "epoch": 2.9333333333333336, "percentage": 97.78, "elapsed_time": "13:56:57", "remaining_time": "0:19:01"}