|
{"current_steps": 1, "total_steps": 296, "loss": 0.8793, "lr": 1.111111111111111e-06, "epoch": 0.003368421052631579, "percentage": 0.34, "elapsed_time": "0:02:02", "remaining_time": "9:59:52"} |
|
{"current_steps": 2, "total_steps": 296, "loss": 0.9892, "lr": 2.222222222222222e-06, "epoch": 0.006736842105263158, "percentage": 0.68, "elapsed_time": "0:03:42", "remaining_time": "9:04:52"} |
|
{"current_steps": 3, "total_steps": 296, "loss": 0.9881, "lr": 3.3333333333333333e-06, "epoch": 0.010105263157894737, "percentage": 1.01, "elapsed_time": "0:05:23", "remaining_time": "8:46:16"} |
|
{"current_steps": 4, "total_steps": 296, "loss": 0.9518, "lr": 4.444444444444444e-06, "epoch": 0.013473684210526317, "percentage": 1.35, "elapsed_time": "0:07:03", "remaining_time": "8:34:43"} |
|
{"current_steps": 5, "total_steps": 296, "loss": 0.9289, "lr": 5.555555555555557e-06, "epoch": 0.016842105263157894, "percentage": 1.69, "elapsed_time": "0:08:44", "remaining_time": "8:28:23"} |
|
{"current_steps": 5, "total_steps": 296, "eval_loss": 0.827698826789856, "epoch": 0.016842105263157894, "percentage": 1.69, "elapsed_time": "0:16:06", "remaining_time": "15:37:19"} |
|
{"current_steps": 6, "total_steps": 296, "loss": 0.805, "lr": 6.666666666666667e-06, "epoch": 0.020210526315789474, "percentage": 2.03, "elapsed_time": "0:18:44", "remaining_time": "15:05:53"} |
|
{"current_steps": 7, "total_steps": 296, "loss": 0.7305, "lr": 7.77777777777778e-06, "epoch": 0.023578947368421053, "percentage": 2.36, "elapsed_time": "0:20:27", "remaining_time": "14:04:25"} |
|
{"current_steps": 8, "total_steps": 296, "loss": 0.8816, "lr": 8.888888888888888e-06, "epoch": 0.026947368421052633, "percentage": 2.7, "elapsed_time": "0:22:09", "remaining_time": "13:17:58"} |
|
{"current_steps": 9, "total_steps": 296, "loss": 0.7849, "lr": 1e-05, "epoch": 0.03031578947368421, "percentage": 3.04, "elapsed_time": "0:23:56", "remaining_time": "12:43:39"} |
|
{"current_steps": 10, "total_steps": 296, "loss": 0.7032, "lr": 9.965156794425088e-06, "epoch": 0.03368421052631579, "percentage": 3.38, "elapsed_time": "0:25:42", "remaining_time": "12:15:28"} |
|
{"current_steps": 10, "total_steps": 296, "eval_loss": 0.6998360753059387, "epoch": 0.03368421052631579, "percentage": 3.38, "elapsed_time": "0:30:39", "remaining_time": "14:36:36"} |
|
{"current_steps": 11, "total_steps": 296, "loss": 0.6569, "lr": 9.930313588850174e-06, "epoch": 0.03705263157894737, "percentage": 3.72, "elapsed_time": "0:32:22", "remaining_time": "13:58:47"} |
|
{"current_steps": 12, "total_steps": 296, "loss": 0.8249, "lr": 9.895470383275261e-06, "epoch": 0.04042105263157895, "percentage": 4.05, "elapsed_time": "0:34:06", "remaining_time": "13:27:03"} |
|
{"current_steps": 13, "total_steps": 296, "loss": 0.7339, "lr": 9.860627177700349e-06, "epoch": 0.043789473684210524, "percentage": 4.39, "elapsed_time": "0:35:50", "remaining_time": "13:00:25"} |
|
{"current_steps": 14, "total_steps": 296, "loss": 0.7037, "lr": 9.825783972125436e-06, "epoch": 0.04715789473684211, "percentage": 4.73, "elapsed_time": "0:37:34", "remaining_time": "12:36:58"} |
|
{"current_steps": 15, "total_steps": 296, "loss": 0.735, "lr": 9.790940766550524e-06, "epoch": 0.05052631578947368, "percentage": 5.07, "elapsed_time": "0:39:19", "remaining_time": "12:16:36"} |
|
{"current_steps": 15, "total_steps": 296, "eval_loss": 0.6130012273788452, "epoch": 0.05052631578947368, "percentage": 5.07, "elapsed_time": "0:44:15", "remaining_time": "13:49:04"} |
|
{"current_steps": 16, "total_steps": 296, "loss": 0.6041, "lr": 9.756097560975611e-06, "epoch": 0.053894736842105266, "percentage": 5.41, "elapsed_time": "0:45:57", "remaining_time": "13:24:14"} |
|
{"current_steps": 17, "total_steps": 296, "loss": 0.5915, "lr": 9.721254355400698e-06, "epoch": 0.05726315789473684, "percentage": 5.74, "elapsed_time": "0:47:38", "remaining_time": "13:01:49"} |
|
{"current_steps": 18, "total_steps": 296, "loss": 0.6117, "lr": 9.686411149825786e-06, "epoch": 0.06063157894736842, "percentage": 6.08, "elapsed_time": "0:49:16", "remaining_time": "12:41:08"} |
|
{"current_steps": 19, "total_steps": 296, "loss": 0.6422, "lr": 9.651567944250871e-06, "epoch": 0.064, "percentage": 6.42, "elapsed_time": "0:50:58", "remaining_time": "12:23:02"} |
|
{"current_steps": 20, "total_steps": 296, "loss": 0.6398, "lr": 9.616724738675959e-06, "epoch": 0.06736842105263158, "percentage": 6.76, "elapsed_time": "0:52:43", "remaining_time": "12:07:33"} |
|
{"current_steps": 20, "total_steps": 296, "eval_loss": 0.565711259841919, "epoch": 0.06736842105263158, "percentage": 6.76, "elapsed_time": "0:57:39", "remaining_time": "13:15:37"} |
|
{"current_steps": 21, "total_steps": 296, "loss": 0.6231, "lr": 9.581881533101046e-06, "epoch": 0.07073684210526315, "percentage": 7.09, "elapsed_time": "0:59:32", "remaining_time": "12:59:48"} |
|
{"current_steps": 22, "total_steps": 296, "loss": 0.5259, "lr": 9.547038327526134e-06, "epoch": 0.07410526315789474, "percentage": 7.43, "elapsed_time": "1:01:26", "remaining_time": "12:45:09"} |
|
{"current_steps": 23, "total_steps": 296, "loss": 0.6304, "lr": 9.51219512195122e-06, "epoch": 0.07747368421052632, "percentage": 7.77, "elapsed_time": "1:03:16", "remaining_time": "12:31:07"} |
|
{"current_steps": 24, "total_steps": 296, "loss": 0.5735, "lr": 9.477351916376307e-06, "epoch": 0.0808421052631579, "percentage": 8.11, "elapsed_time": "1:05:04", "remaining_time": "12:17:30"} |
|
{"current_steps": 25, "total_steps": 296, "loss": 0.5123, "lr": 9.442508710801394e-06, "epoch": 0.08421052631578947, "percentage": 8.45, "elapsed_time": "1:06:53", "remaining_time": "12:05:08"} |
|
{"current_steps": 25, "total_steps": 296, "eval_loss": 0.5578904747962952, "epoch": 0.08421052631578947, "percentage": 8.45, "elapsed_time": "1:11:49", "remaining_time": "12:58:37"} |
|
{"current_steps": 26, "total_steps": 296, "loss": 0.547, "lr": 9.407665505226482e-06, "epoch": 0.08757894736842105, "percentage": 8.78, "elapsed_time": "1:13:39", "remaining_time": "12:44:52"} |
|
{"current_steps": 27, "total_steps": 296, "loss": 0.6267, "lr": 9.372822299651569e-06, "epoch": 0.09094736842105264, "percentage": 9.12, "elapsed_time": "1:15:28", "remaining_time": "12:32:00"} |
|
{"current_steps": 28, "total_steps": 296, "loss": 0.5053, "lr": 9.337979094076656e-06, "epoch": 0.09431578947368421, "percentage": 9.46, "elapsed_time": "1:17:13", "remaining_time": "12:19:12"} |
|
{"current_steps": 29, "total_steps": 296, "loss": 0.6092, "lr": 9.303135888501744e-06, "epoch": 0.09768421052631579, "percentage": 9.8, "elapsed_time": "1:19:00", "remaining_time": "12:07:28"} |
|
{"current_steps": 30, "total_steps": 296, "loss": 0.5098, "lr": 9.268292682926831e-06, "epoch": 0.10105263157894737, "percentage": 10.14, "elapsed_time": "1:20:44", "remaining_time": "11:55:54"} |
|
{"current_steps": 30, "total_steps": 296, "eval_loss": 0.5403761267662048, "epoch": 0.10105263157894737, "percentage": 10.14, "elapsed_time": "1:25:40", "remaining_time": "12:39:39"} |
|
{"current_steps": 31, "total_steps": 296, "loss": 0.5006, "lr": 9.233449477351917e-06, "epoch": 0.10442105263157894, "percentage": 10.47, "elapsed_time": "1:27:30", "remaining_time": "12:28:01"} |
|
{"current_steps": 32, "total_steps": 296, "loss": 0.5065, "lr": 9.198606271777004e-06, "epoch": 0.10778947368421053, "percentage": 10.81, "elapsed_time": "1:29:11", "remaining_time": "12:15:47"} |
|
{"current_steps": 33, "total_steps": 296, "loss": 0.5312, "lr": 9.163763066202092e-06, "epoch": 0.11115789473684211, "percentage": 11.15, "elapsed_time": "1:30:54", "remaining_time": "12:04:26"} |
|
{"current_steps": 34, "total_steps": 296, "loss": 0.5278, "lr": 9.12891986062718e-06, "epoch": 0.11452631578947368, "percentage": 11.49, "elapsed_time": "1:32:34", "remaining_time": "11:53:18"} |
|
{"current_steps": 35, "total_steps": 296, "loss": 0.5597, "lr": 9.094076655052265e-06, "epoch": 0.11789473684210526, "percentage": 11.82, "elapsed_time": "1:34:16", "remaining_time": "11:43:01"} |
|
{"current_steps": 35, "total_steps": 296, "eval_loss": 0.5175214409828186, "epoch": 0.11789473684210526, "percentage": 11.82, "elapsed_time": "1:39:12", "remaining_time": "12:19:49"} |
|
{"current_steps": 36, "total_steps": 296, "loss": 0.5023, "lr": 9.059233449477352e-06, "epoch": 0.12126315789473684, "percentage": 12.16, "elapsed_time": "1:40:55", "remaining_time": "12:08:53"} |
|
{"current_steps": 37, "total_steps": 296, "loss": 0.6115, "lr": 9.02439024390244e-06, "epoch": 0.12463157894736843, "percentage": 12.5, "elapsed_time": "1:42:43", "remaining_time": "11:59:01"} |
|
{"current_steps": 38, "total_steps": 296, "loss": 0.5682, "lr": 8.989547038327527e-06, "epoch": 0.128, "percentage": 12.84, "elapsed_time": "1:44:24", "remaining_time": "11:48:54"} |
|
{"current_steps": 39, "total_steps": 296, "loss": 0.5806, "lr": 8.954703832752613e-06, "epoch": 0.13136842105263158, "percentage": 13.18, "elapsed_time": "1:46:11", "remaining_time": "11:39:46"} |
|
{"current_steps": 40, "total_steps": 296, "loss": 0.4819, "lr": 8.9198606271777e-06, "epoch": 0.13473684210526315, "percentage": 13.51, "elapsed_time": "1:47:53", "remaining_time": "11:30:31"} |
|
{"current_steps": 40, "total_steps": 296, "eval_loss": 0.5115832090377808, "epoch": 0.13473684210526315, "percentage": 13.51, "elapsed_time": "1:52:49", "remaining_time": "12:02:05"} |
|
{"current_steps": 41, "total_steps": 296, "loss": 0.5607, "lr": 8.885017421602788e-06, "epoch": 0.13810526315789473, "percentage": 13.85, "elapsed_time": "1:54:37", "remaining_time": "11:52:56"} |
|
{"current_steps": 42, "total_steps": 296, "loss": 0.5767, "lr": 8.850174216027875e-06, "epoch": 0.1414736842105263, "percentage": 14.19, "elapsed_time": "1:56:27", "remaining_time": "11:44:14"} |
|
{"current_steps": 43, "total_steps": 296, "loss": 0.507, "lr": 8.815331010452962e-06, "epoch": 0.14484210526315788, "percentage": 14.53, "elapsed_time": "1:58:20", "remaining_time": "11:36:19"} |
|
{"current_steps": 44, "total_steps": 296, "loss": 0.4744, "lr": 8.78048780487805e-06, "epoch": 0.1482105263157895, "percentage": 14.86, "elapsed_time": "2:00:09", "remaining_time": "11:28:07"} |
|
{"current_steps": 45, "total_steps": 296, "loss": 0.4874, "lr": 8.745644599303137e-06, "epoch": 0.15157894736842106, "percentage": 15.2, "elapsed_time": "2:02:01", "remaining_time": "11:20:35"} |
|
{"current_steps": 45, "total_steps": 296, "eval_loss": 0.504241943359375, "epoch": 0.15157894736842106, "percentage": 15.2, "elapsed_time": "2:06:57", "remaining_time": "11:48:06"} |
|
{"current_steps": 46, "total_steps": 296, "loss": 0.5559, "lr": 8.710801393728223e-06, "epoch": 0.15494736842105264, "percentage": 15.54, "elapsed_time": "2:08:42", "remaining_time": "11:39:30"} |
|
{"current_steps": 47, "total_steps": 296, "loss": 0.5664, "lr": 8.67595818815331e-06, "epoch": 0.15831578947368422, "percentage": 15.88, "elapsed_time": "2:10:25", "remaining_time": "11:31:00"} |
|
{"current_steps": 48, "total_steps": 296, "loss": 0.4928, "lr": 8.641114982578398e-06, "epoch": 0.1616842105263158, "percentage": 16.22, "elapsed_time": "2:12:07", "remaining_time": "11:22:38"} |
|
{"current_steps": 49, "total_steps": 296, "loss": 0.5526, "lr": 8.606271777003485e-06, "epoch": 0.16505263157894737, "percentage": 16.55, "elapsed_time": "2:13:49", "remaining_time": "11:14:37"} |
|
{"current_steps": 50, "total_steps": 296, "loss": 0.5318, "lr": 8.571428571428571e-06, "epoch": 0.16842105263157894, "percentage": 16.89, "elapsed_time": "2:15:31", "remaining_time": "11:06:48"} |
|
{"current_steps": 50, "total_steps": 296, "eval_loss": 0.5086100101470947, "epoch": 0.16842105263157894, "percentage": 16.89, "elapsed_time": "2:20:27", "remaining_time": "11:31:04"} |
|
{"current_steps": 51, "total_steps": 296, "loss": 0.4785, "lr": 8.536585365853658e-06, "epoch": 0.17178947368421052, "percentage": 17.23, "elapsed_time": "2:22:11", "remaining_time": "11:23:02"} |
|
{"current_steps": 52, "total_steps": 296, "loss": 0.4902, "lr": 8.501742160278746e-06, "epoch": 0.1751578947368421, "percentage": 17.57, "elapsed_time": "2:23:55", "remaining_time": "11:15:21"} |
|
{"current_steps": 53, "total_steps": 296, "loss": 0.5576, "lr": 8.466898954703833e-06, "epoch": 0.17852631578947367, "percentage": 17.91, "elapsed_time": "2:25:39", "remaining_time": "11:07:49"} |
|
{"current_steps": 54, "total_steps": 296, "loss": 0.5326, "lr": 8.43205574912892e-06, "epoch": 0.18189473684210528, "percentage": 18.24, "elapsed_time": "2:27:22", "remaining_time": "11:00:26"} |
|
{"current_steps": 55, "total_steps": 296, "loss": 0.4955, "lr": 8.397212543554008e-06, "epoch": 0.18526315789473685, "percentage": 18.58, "elapsed_time": "2:29:11", "remaining_time": "10:53:44"} |
|
{"current_steps": 55, "total_steps": 296, "eval_loss": 0.5065380334854126, "epoch": 0.18526315789473685, "percentage": 18.58, "elapsed_time": "2:34:07", "remaining_time": "11:15:21"} |
|
{"current_steps": 56, "total_steps": 296, "loss": 0.5464, "lr": 8.362369337979095e-06, "epoch": 0.18863157894736843, "percentage": 18.92, "elapsed_time": "2:35:56", "remaining_time": "11:08:17"} |
|
{"current_steps": 57, "total_steps": 296, "loss": 0.5063, "lr": 8.327526132404183e-06, "epoch": 0.192, "percentage": 19.26, "elapsed_time": "2:37:45", "remaining_time": "11:01:27"} |
|
{"current_steps": 58, "total_steps": 296, "loss": 0.5212, "lr": 8.292682926829268e-06, "epoch": 0.19536842105263158, "percentage": 19.59, "elapsed_time": "2:39:33", "remaining_time": "10:54:44"} |
|
{"current_steps": 59, "total_steps": 296, "loss": 0.5516, "lr": 8.257839721254356e-06, "epoch": 0.19873684210526316, "percentage": 19.93, "elapsed_time": "2:41:17", "remaining_time": "10:47:53"} |
|
{"current_steps": 60, "total_steps": 296, "loss": 0.4956, "lr": 8.222996515679443e-06, "epoch": 0.20210526315789473, "percentage": 20.27, "elapsed_time": "2:42:59", "remaining_time": "10:41:07"} |
|
{"current_steps": 60, "total_steps": 296, "eval_loss": 0.48709771037101746, "epoch": 0.20210526315789473, "percentage": 20.27, "elapsed_time": "2:47:55", "remaining_time": "11:00:31"} |
|
{"current_steps": 61, "total_steps": 296, "loss": 0.5262, "lr": 8.18815331010453e-06, "epoch": 0.2054736842105263, "percentage": 20.61, "elapsed_time": "2:49:38", "remaining_time": "10:53:33"} |
|
{"current_steps": 62, "total_steps": 296, "loss": 0.4838, "lr": 8.153310104529616e-06, "epoch": 0.20884210526315788, "percentage": 20.95, "elapsed_time": "2:51:26", "remaining_time": "10:47:04"} |
|
{"current_steps": 63, "total_steps": 296, "loss": 0.4767, "lr": 8.118466898954704e-06, "epoch": 0.21221052631578946, "percentage": 21.28, "elapsed_time": "2:53:11", "remaining_time": "10:40:33"} |
|
{"current_steps": 64, "total_steps": 296, "loss": 0.5218, "lr": 8.083623693379791e-06, "epoch": 0.21557894736842106, "percentage": 21.62, "elapsed_time": "2:54:59", "remaining_time": "10:34:19"} |
|
{"current_steps": 65, "total_steps": 296, "loss": 0.5021, "lr": 8.048780487804879e-06, "epoch": 0.21894736842105264, "percentage": 21.96, "elapsed_time": "2:56:42", "remaining_time": "10:27:58"} |
|
{"current_steps": 65, "total_steps": 296, "eval_loss": 0.489128053188324, "epoch": 0.21894736842105264, "percentage": 21.96, "elapsed_time": "3:01:38", "remaining_time": "10:45:30"} |
|
{"current_steps": 66, "total_steps": 296, "loss": 0.4661, "lr": 8.013937282229966e-06, "epoch": 0.22231578947368422, "percentage": 22.3, "elapsed_time": "3:03:26", "remaining_time": "10:39:14"} |
|
{"current_steps": 67, "total_steps": 296, "loss": 0.5237, "lr": 7.979094076655053e-06, "epoch": 0.2256842105263158, "percentage": 22.64, "elapsed_time": "3:05:11", "remaining_time": "10:32:57"} |
|
{"current_steps": 68, "total_steps": 296, "loss": 0.5482, "lr": 7.94425087108014e-06, "epoch": 0.22905263157894737, "percentage": 22.97, "elapsed_time": "3:06:57", "remaining_time": "10:26:53"} |
|
{"current_steps": 69, "total_steps": 296, "loss": 0.5543, "lr": 7.909407665505228e-06, "epoch": 0.23242105263157894, "percentage": 23.31, "elapsed_time": "3:08:45", "remaining_time": "10:21:00"} |
|
{"current_steps": 70, "total_steps": 296, "loss": 0.5192, "lr": 7.874564459930314e-06, "epoch": 0.23578947368421052, "percentage": 23.65, "elapsed_time": "3:10:32", "remaining_time": "10:15:09"} |
|
{"current_steps": 70, "total_steps": 296, "eval_loss": 0.5080568790435791, "epoch": 0.23578947368421052, "percentage": 23.65, "elapsed_time": "3:15:27", "remaining_time": "10:31:04"} |
|
{"current_steps": 71, "total_steps": 296, "loss": 0.4802, "lr": 7.839721254355401e-06, "epoch": 0.2391578947368421, "percentage": 23.99, "elapsed_time": "3:17:10", "remaining_time": "10:24:51"} |
|
{"current_steps": 72, "total_steps": 296, "loss": 0.4789, "lr": 7.804878048780489e-06, "epoch": 0.24252631578947367, "percentage": 24.32, "elapsed_time": "3:18:58", "remaining_time": "10:19:01"} |
|
{"current_steps": 73, "total_steps": 296, "loss": 0.497, "lr": 7.770034843205574e-06, "epoch": 0.24589473684210525, "percentage": 24.66, "elapsed_time": "3:20:43", "remaining_time": "10:13:09"} |
|
{"current_steps": 74, "total_steps": 296, "loss": 0.5588, "lr": 7.735191637630662e-06, "epoch": 0.24926315789473685, "percentage": 25.0, "elapsed_time": "3:22:34", "remaining_time": "10:07:42"} |
|
{"current_steps": 75, "total_steps": 296, "loss": 0.4748, "lr": 7.70034843205575e-06, "epoch": 0.25263157894736843, "percentage": 25.34, "elapsed_time": "3:24:19", "remaining_time": "10:02:04"} |
|
{"current_steps": 75, "total_steps": 296, "eval_loss": 0.490384042263031, "epoch": 0.25263157894736843, "percentage": 25.34, "elapsed_time": "3:29:15", "remaining_time": "10:16:36"} |
|
{"current_steps": 76, "total_steps": 296, "loss": 0.4774, "lr": 7.665505226480837e-06, "epoch": 0.256, "percentage": 25.68, "elapsed_time": "3:31:02", "remaining_time": "10:10:55"} |
|
{"current_steps": 77, "total_steps": 296, "loss": 0.5141, "lr": 7.630662020905924e-06, "epoch": 0.2593684210526316, "percentage": 26.01, "elapsed_time": "3:32:46", "remaining_time": "10:05:10"} |
|
{"current_steps": 78, "total_steps": 296, "loss": 0.4826, "lr": 7.595818815331011e-06, "epoch": 0.26273684210526316, "percentage": 26.35, "elapsed_time": "3:34:34", "remaining_time": "9:59:43"} |
|
{"current_steps": 79, "total_steps": 296, "loss": 0.5098, "lr": 7.560975609756098e-06, "epoch": 0.26610526315789473, "percentage": 26.69, "elapsed_time": "3:36:20", "remaining_time": "9:54:15"} |
|
{"current_steps": 80, "total_steps": 296, "loss": 0.4881, "lr": 7.5261324041811855e-06, "epoch": 0.2694736842105263, "percentage": 27.03, "elapsed_time": "3:38:05", "remaining_time": "9:48:49"} |
|
{"current_steps": 80, "total_steps": 296, "eval_loss": 0.48383715748786926, "epoch": 0.2694736842105263, "percentage": 27.03, "elapsed_time": "3:43:00", "remaining_time": "10:02:08"} |
|
{"current_steps": 81, "total_steps": 296, "loss": 0.5106, "lr": 7.491289198606272e-06, "epoch": 0.2728421052631579, "percentage": 27.36, "elapsed_time": "3:44:45", "remaining_time": "9:56:35"} |
|
{"current_steps": 82, "total_steps": 296, "loss": 0.4802, "lr": 7.4564459930313594e-06, "epoch": 0.27621052631578946, "percentage": 27.7, "elapsed_time": "3:46:30", "remaining_time": "9:51:06"} |
|
{"current_steps": 83, "total_steps": 296, "loss": 0.4946, "lr": 7.421602787456447e-06, "epoch": 0.27957894736842104, "percentage": 28.04, "elapsed_time": "3:48:17", "remaining_time": "9:45:52"} |
|
{"current_steps": 84, "total_steps": 296, "loss": 0.5303, "lr": 7.386759581881534e-06, "epoch": 0.2829473684210526, "percentage": 28.38, "elapsed_time": "3:50:10", "remaining_time": "9:40:55"} |
|
{"current_steps": 85, "total_steps": 296, "loss": 0.5092, "lr": 7.35191637630662e-06, "epoch": 0.2863157894736842, "percentage": 28.72, "elapsed_time": "3:51:55", "remaining_time": "9:35:44"} |
|
{"current_steps": 85, "total_steps": 296, "eval_loss": 0.493765652179718, "epoch": 0.2863157894736842, "percentage": 28.72, "elapsed_time": "3:56:51", "remaining_time": "9:47:59"} |
|
{"current_steps": 86, "total_steps": 296, "loss": 0.5155, "lr": 7.317073170731707e-06, "epoch": 0.28968421052631577, "percentage": 29.05, "elapsed_time": "3:58:35", "remaining_time": "9:42:35"} |
|
{"current_steps": 87, "total_steps": 296, "loss": 0.5025, "lr": 7.282229965156795e-06, "epoch": 0.29305263157894734, "percentage": 29.39, "elapsed_time": "4:00:23", "remaining_time": "9:37:29"} |
|
{"current_steps": 88, "total_steps": 296, "loss": 0.4836, "lr": 7.247386759581882e-06, "epoch": 0.296421052631579, "percentage": 29.73, "elapsed_time": "4:02:12", "remaining_time": "9:32:28"} |
|
{"current_steps": 89, "total_steps": 296, "loss": 0.5086, "lr": 7.212543554006969e-06, "epoch": 0.29978947368421055, "percentage": 30.07, "elapsed_time": "4:04:05", "remaining_time": "9:27:42"} |
|
{"current_steps": 90, "total_steps": 296, "loss": 0.4971, "lr": 7.177700348432056e-06, "epoch": 0.3031578947368421, "percentage": 30.41, "elapsed_time": "4:05:56", "remaining_time": "9:22:55"} |
|
{"current_steps": 90, "total_steps": 296, "eval_loss": 0.4835096299648285, "epoch": 0.3031578947368421, "percentage": 30.41, "elapsed_time": "4:10:52", "remaining_time": "9:34:13"} |
|
{"current_steps": 91, "total_steps": 296, "loss": 0.444, "lr": 7.1428571428571436e-06, "epoch": 0.3065263157894737, "percentage": 30.74, "elapsed_time": "4:12:37", "remaining_time": "9:29:05"} |
|
{"current_steps": 92, "total_steps": 296, "loss": 0.486, "lr": 7.108013937282231e-06, "epoch": 0.3098947368421053, "percentage": 31.08, "elapsed_time": "4:14:20", "remaining_time": "9:23:57"} |
|
{"current_steps": 93, "total_steps": 296, "loss": 0.4929, "lr": 7.0731707317073175e-06, "epoch": 0.31326315789473685, "percentage": 31.42, "elapsed_time": "4:16:06", "remaining_time": "9:19:01"} |
|
{"current_steps": 94, "total_steps": 296, "loss": 0.5073, "lr": 7.038327526132405e-06, "epoch": 0.31663157894736843, "percentage": 31.76, "elapsed_time": "4:17:52", "remaining_time": "9:14:08"} |
|
{"current_steps": 95, "total_steps": 296, "loss": 0.4878, "lr": 7.003484320557492e-06, "epoch": 0.32, "percentage": 32.09, "elapsed_time": "4:19:34", "remaining_time": "9:09:11"} |
|
{"current_steps": 95, "total_steps": 296, "eval_loss": 0.4704912602901459, "epoch": 0.32, "percentage": 32.09, "elapsed_time": "4:24:30", "remaining_time": "9:19:37"} |
|
{"current_steps": 96, "total_steps": 296, "loss": 0.49, "lr": 6.96864111498258e-06, "epoch": 0.3233684210526316, "percentage": 32.43, "elapsed_time": "4:26:10", "remaining_time": "9:14:32"} |
|
{"current_steps": 97, "total_steps": 296, "loss": 0.5029, "lr": 6.9337979094076655e-06, "epoch": 0.32673684210526316, "percentage": 32.77, "elapsed_time": "4:27:53", "remaining_time": "9:09:34"} |
|
{"current_steps": 98, "total_steps": 296, "loss": 0.4621, "lr": 6.898954703832753e-06, "epoch": 0.33010526315789473, "percentage": 33.11, "elapsed_time": "4:29:36", "remaining_time": "9:04:42"} |
|
{"current_steps": 99, "total_steps": 296, "loss": 0.5222, "lr": 6.86411149825784e-06, "epoch": 0.3334736842105263, "percentage": 33.45, "elapsed_time": "4:31:21", "remaining_time": "8:59:57"} |
|
{"current_steps": 100, "total_steps": 296, "loss": 0.4762, "lr": 6.829268292682928e-06, "epoch": 0.3368421052631579, "percentage": 33.78, "elapsed_time": "4:34:04", "remaining_time": "8:57:12"} |
|
{"current_steps": 100, "total_steps": 296, "eval_loss": 0.4719935953617096, "epoch": 0.3368421052631579, "percentage": 33.78, "elapsed_time": "4:39:00", "remaining_time": "9:06:51"} |
|
{"current_steps": 101, "total_steps": 296, "loss": 0.4347, "lr": 6.794425087108014e-06, "epoch": 0.34021052631578946, "percentage": 34.12, "elapsed_time": "4:40:47", "remaining_time": "9:02:06"} |
|
{"current_steps": 102, "total_steps": 296, "loss": 0.5103, "lr": 6.759581881533102e-06, "epoch": 0.34357894736842104, "percentage": 34.46, "elapsed_time": "4:42:29", "remaining_time": "8:57:17"} |
|
{"current_steps": 103, "total_steps": 296, "loss": 0.4351, "lr": 6.724738675958189e-06, "epoch": 0.3469473684210526, "percentage": 34.8, "elapsed_time": "4:44:17", "remaining_time": "8:52:41"} |
|
{"current_steps": 104, "total_steps": 296, "loss": 0.5018, "lr": 6.6898954703832765e-06, "epoch": 0.3503157894736842, "percentage": 35.14, "elapsed_time": "4:45:59", "remaining_time": "8:47:58"} |
|
{"current_steps": 105, "total_steps": 296, "loss": 0.4511, "lr": 6.655052264808363e-06, "epoch": 0.35368421052631577, "percentage": 35.47, "elapsed_time": "4:47:42", "remaining_time": "8:43:21"} |
|
{"current_steps": 105, "total_steps": 296, "eval_loss": 0.49579426646232605, "epoch": 0.35368421052631577, "percentage": 35.47, "elapsed_time": "4:52:38", "remaining_time": "8:52:19"} |
|
{"current_steps": 106, "total_steps": 296, "loss": 0.5626, "lr": 6.62020905923345e-06, "epoch": 0.35705263157894734, "percentage": 35.81, "elapsed_time": "4:54:23", "remaining_time": "8:47:41"} |
|
{"current_steps": 107, "total_steps": 296, "loss": 0.4872, "lr": 6.585365853658538e-06, "epoch": 0.3604210526315789, "percentage": 36.15, "elapsed_time": "4:56:08", "remaining_time": "8:43:05"} |
|
{"current_steps": 108, "total_steps": 296, "loss": 0.4562, "lr": 6.5505226480836235e-06, "epoch": 0.36378947368421055, "percentage": 36.49, "elapsed_time": "4:57:52", "remaining_time": "8:38:31"} |
|
{"current_steps": 109, "total_steps": 296, "loss": 0.4512, "lr": 6.515679442508711e-06, "epoch": 0.3671578947368421, "percentage": 36.82, "elapsed_time": "4:59:35", "remaining_time": "8:33:59"} |
|
{"current_steps": 110, "total_steps": 296, "loss": 0.5213, "lr": 6.480836236933798e-06, "epoch": 0.3705263157894737, "percentage": 37.16, "elapsed_time": "5:01:17", "remaining_time": "8:29:26"} |
|
{"current_steps": 110, "total_steps": 296, "eval_loss": 0.48256850242614746, "epoch": 0.3705263157894737, "percentage": 37.16, "elapsed_time": "5:06:12", "remaining_time": "8:37:46"} |
|
{"current_steps": 111, "total_steps": 296, "loss": 0.5014, "lr": 6.445993031358886e-06, "epoch": 0.3738947368421053, "percentage": 37.5, "elapsed_time": "5:07:57", "remaining_time": "8:33:15"} |
|
{"current_steps": 112, "total_steps": 296, "loss": 0.4528, "lr": 6.411149825783972e-06, "epoch": 0.37726315789473686, "percentage": 37.84, "elapsed_time": "5:09:40", "remaining_time": "8:28:44"} |
|
{"current_steps": 113, "total_steps": 296, "loss": 0.4495, "lr": 6.37630662020906e-06, "epoch": 0.38063157894736843, "percentage": 38.18, "elapsed_time": "5:11:23", "remaining_time": "8:24:17"} |
|
{"current_steps": 114, "total_steps": 296, "loss": 0.5016, "lr": 6.341463414634147e-06, "epoch": 0.384, "percentage": 38.51, "elapsed_time": "5:13:06", "remaining_time": "8:19:52"} |
|
{"current_steps": 115, "total_steps": 296, "loss": 0.4569, "lr": 6.3066202090592345e-06, "epoch": 0.3873684210526316, "percentage": 38.85, "elapsed_time": "5:14:49", "remaining_time": "8:15:30"} |
|
{"current_steps": 115, "total_steps": 296, "eval_loss": 0.4829513430595398, "epoch": 0.3873684210526316, "percentage": 38.85, "elapsed_time": "5:19:45", "remaining_time": "8:23:16"} |
|
{"current_steps": 116, "total_steps": 296, "loss": 0.4074, "lr": 6.27177700348432e-06, "epoch": 0.39073684210526316, "percentage": 39.19, "elapsed_time": "5:21:26", "remaining_time": "8:18:46"} |
|
{"current_steps": 117, "total_steps": 296, "loss": 0.4507, "lr": 6.236933797909408e-06, "epoch": 0.39410526315789474, "percentage": 39.53, "elapsed_time": "5:23:15", "remaining_time": "8:14:32"} |
|
{"current_steps": 118, "total_steps": 296, "loss": 0.4851, "lr": 6.202090592334495e-06, "epoch": 0.3974736842105263, "percentage": 39.86, "elapsed_time": "5:24:57", "remaining_time": "8:10:11"} |
|
{"current_steps": 119, "total_steps": 296, "loss": 0.4862, "lr": 6.1672473867595825e-06, "epoch": 0.4008421052631579, "percentage": 40.2, "elapsed_time": "5:26:42", "remaining_time": "8:05:56"} |
|
{"current_steps": 120, "total_steps": 296, "loss": 0.4919, "lr": 6.132404181184669e-06, "epoch": 0.40421052631578946, "percentage": 40.54, "elapsed_time": "5:28:24", "remaining_time": "8:01:39"} |
|
{"current_steps": 120, "total_steps": 296, "eval_loss": 0.46267950534820557, "epoch": 0.40421052631578946, "percentage": 40.54, "elapsed_time": "5:33:20", "remaining_time": "8:08:53"} |
|
{"current_steps": 121, "total_steps": 296, "loss": 0.4472, "lr": 6.0975609756097564e-06, "epoch": 0.40757894736842104, "percentage": 40.88, "elapsed_time": "5:35:02", "remaining_time": "8:04:34"} |
|
{"current_steps": 122, "total_steps": 296, "loss": 0.434, "lr": 6.062717770034844e-06, "epoch": 0.4109473684210526, "percentage": 41.22, "elapsed_time": "5:36:46", "remaining_time": "8:00:19"} |
|
{"current_steps": 123, "total_steps": 296, "loss": 0.4624, "lr": 6.027874564459931e-06, "epoch": 0.4143157894736842, "percentage": 41.55, "elapsed_time": "5:38:31", "remaining_time": "7:56:07"} |
|
{"current_steps": 124, "total_steps": 296, "loss": 0.488, "lr": 5.993031358885018e-06, "epoch": 0.41768421052631577, "percentage": 41.89, "elapsed_time": "5:40:26", "remaining_time": "7:52:13"} |
|
{"current_steps": 125, "total_steps": 296, "loss": 0.4853, "lr": 5.958188153310105e-06, "epoch": 0.42105263157894735, "percentage": 42.23, "elapsed_time": "5:42:35", "remaining_time": "7:48:39"} |
|
{"current_steps": 125, "total_steps": 296, "eval_loss": 0.45646998286247253, "epoch": 0.42105263157894735, "percentage": 42.23, "elapsed_time": "5:47:30", "remaining_time": "7:55:24"} |
|
{"current_steps": 126, "total_steps": 296, "loss": 0.4685, "lr": 5.923344947735193e-06, "epoch": 0.4244210526315789, "percentage": 42.57, "elapsed_time": "5:49:55", "remaining_time": "7:52:07"} |
|
{"current_steps": 127, "total_steps": 296, "loss": 0.4606, "lr": 5.88850174216028e-06, "epoch": 0.42778947368421055, "percentage": 42.91, "elapsed_time": "5:52:11", "remaining_time": "7:48:40"} |
|
{"current_steps": 128, "total_steps": 296, "loss": 0.4822, "lr": 5.853658536585366e-06, "epoch": 0.43115789473684213, "percentage": 43.24, "elapsed_time": "5:54:23", "remaining_time": "7:45:08"} |
|
{"current_steps": 129, "total_steps": 296, "loss": 0.4591, "lr": 5.818815331010453e-06, "epoch": 0.4345263157894737, "percentage": 43.58, "elapsed_time": "5:56:25", "remaining_time": "7:41:24"} |
|
{"current_steps": 130, "total_steps": 296, "loss": 0.4638, "lr": 5.7839721254355405e-06, "epoch": 0.4378947368421053, "percentage": 43.92, "elapsed_time": "5:58:31", "remaining_time": "7:37:48"} |
|
{"current_steps": 130, "total_steps": 296, "eval_loss": 0.45767614245414734, "epoch": 0.4378947368421053, "percentage": 43.92, "elapsed_time": "6:03:27", "remaining_time": "7:44:06"} |
|
{"current_steps": 131, "total_steps": 296, "loss": 0.4872, "lr": 5.749128919860628e-06, "epoch": 0.44126315789473686, "percentage": 44.26, "elapsed_time": "6:05:12", "remaining_time": "7:39:59"} |
|
{"current_steps": 132, "total_steps": 296, "loss": 0.4403, "lr": 5.7142857142857145e-06, "epoch": 0.44463157894736843, "percentage": 44.59, "elapsed_time": "6:06:57", "remaining_time": "7:35:54"} |
|
{"current_steps": 133, "total_steps": 296, "loss": 0.4933, "lr": 5.679442508710802e-06, "epoch": 0.448, "percentage": 44.93, "elapsed_time": "6:08:42", "remaining_time": "7:31:52"} |
|
{"current_steps": 134, "total_steps": 296, "loss": 0.4297, "lr": 5.644599303135889e-06, "epoch": 0.4513684210526316, "percentage": 45.27, "elapsed_time": "6:10:29", "remaining_time": "7:27:54"} |
|
{"current_steps": 135, "total_steps": 296, "loss": 0.4941, "lr": 5.609756097560977e-06, "epoch": 0.45473684210526316, "percentage": 45.61, "elapsed_time": "6:12:14", "remaining_time": "7:23:56"} |
|
{"current_steps": 135, "total_steps": 296, "eval_loss": 0.45491233468055725, "epoch": 0.45473684210526316, "percentage": 45.61, "elapsed_time": "6:17:11", "remaining_time": "7:29:49"} |
|
{"current_steps": 136, "total_steps": 296, "loss": 0.4646, "lr": 5.574912891986063e-06, "epoch": 0.45810526315789474, "percentage": 45.95, "elapsed_time": "6:18:56", "remaining_time": "7:25:48"} |
|
{"current_steps": 137, "total_steps": 296, "loss": 0.4748, "lr": 5.540069686411151e-06, "epoch": 0.4614736842105263, "percentage": 46.28, "elapsed_time": "6:20:41", "remaining_time": "7:21:49"} |
|
{"current_steps": 138, "total_steps": 296, "loss": 0.4344, "lr": 5.505226480836237e-06, "epoch": 0.4648421052631579, "percentage": 46.62, "elapsed_time": "6:22:28", "remaining_time": "7:17:53"} |
|
{"current_steps": 139, "total_steps": 296, "loss": 0.51, "lr": 5.470383275261324e-06, "epoch": 0.46821052631578947, "percentage": 46.96, "elapsed_time": "6:24:14", "remaining_time": "7:13:59"} |
|
{"current_steps": 140, "total_steps": 296, "loss": 0.4661, "lr": 5.435540069686411e-06, "epoch": 0.47157894736842104, "percentage": 47.3, "elapsed_time": "6:26:04", "remaining_time": "7:10:12"} |
|
{"current_steps": 140, "total_steps": 296, "eval_loss": 0.455171138048172, "epoch": 0.47157894736842104, "percentage": 47.3, "elapsed_time": "6:31:00", "remaining_time": "7:15:42"} |
|
{"current_steps": 141, "total_steps": 296, "loss": 0.5014, "lr": 5.400696864111499e-06, "epoch": 0.4749473684210526, "percentage": 47.64, "elapsed_time": "6:32:49", "remaining_time": "7:11:50"} |
|
{"current_steps": 142, "total_steps": 296, "loss": 0.4457, "lr": 5.365853658536586e-06, "epoch": 0.4783157894736842, "percentage": 47.97, "elapsed_time": "6:34:35", "remaining_time": "7:07:55"} |
|
{"current_steps": 143, "total_steps": 296, "loss": 0.478, "lr": 5.331010452961673e-06, "epoch": 0.48168421052631577, "percentage": 48.31, "elapsed_time": "6:36:18", "remaining_time": "7:04:01"} |
|
{"current_steps": 144, "total_steps": 296, "loss": 0.4622, "lr": 5.29616724738676e-06, "epoch": 0.48505263157894735, "percentage": 48.65, "elapsed_time": "6:38:02", "remaining_time": "7:00:09"} |
|
{"current_steps": 145, "total_steps": 296, "loss": 0.4886, "lr": 5.261324041811847e-06, "epoch": 0.4884210526315789, "percentage": 48.99, "elapsed_time": "6:39:45", "remaining_time": "6:56:17"} |
|
{"current_steps": 145, "total_steps": 296, "eval_loss": 0.4507831335067749, "epoch": 0.4884210526315789, "percentage": 48.99, "elapsed_time": "6:44:41", "remaining_time": "7:01:26"} |
|
{"current_steps": 146, "total_steps": 296, "loss": 0.4533, "lr": 5.226480836236935e-06, "epoch": 0.4917894736842105, "percentage": 49.32, "elapsed_time": "6:46:28", "remaining_time": "6:57:37"} |
|
{"current_steps": 147, "total_steps": 296, "loss": 0.4403, "lr": 5.1916376306620205e-06, "epoch": 0.49515789473684213, "percentage": 49.66, "elapsed_time": "6:48:14", "remaining_time": "6:53:47"} |
|
{"current_steps": 148, "total_steps": 296, "loss": 0.4567, "lr": 5.156794425087108e-06, "epoch": 0.4985263157894737, "percentage": 50.0, "elapsed_time": "6:50:01", "remaining_time": "6:50:01"} |
|
{"current_steps": 149, "total_steps": 296, "loss": 0.4695, "lr": 5.121951219512195e-06, "epoch": 0.5018947368421053, "percentage": 50.34, "elapsed_time": "6:51:47", "remaining_time": "6:46:16"} |
|
{"current_steps": 150, "total_steps": 296, "loss": 0.4433, "lr": 5.087108013937283e-06, "epoch": 0.5052631578947369, "percentage": 50.68, "elapsed_time": "6:53:29", "remaining_time": "6:42:27"} |
|
{"current_steps": 150, "total_steps": 296, "eval_loss": 0.44684070348739624, "epoch": 0.5052631578947369, "percentage": 50.68, "elapsed_time": "6:58:25", "remaining_time": "6:47:15"} |
|
{"current_steps": 151, "total_steps": 296, "loss": 0.4717, "lr": 5.052264808362369e-06, "epoch": 0.5086315789473684, "percentage": 51.01, "elapsed_time": "7:00:08", "remaining_time": "6:43:26"} |
|
{"current_steps": 152, "total_steps": 296, "loss": 0.5013, "lr": 5.017421602787457e-06, "epoch": 0.512, "percentage": 51.35, "elapsed_time": "7:01:47", "remaining_time": "6:39:35"} |
|
{"current_steps": 153, "total_steps": 296, "loss": 0.4592, "lr": 4.982578397212544e-06, "epoch": 0.5153684210526316, "percentage": 51.69, "elapsed_time": "7:03:31", "remaining_time": "6:35:50"} |
|
{"current_steps": 154, "total_steps": 296, "loss": 0.4714, "lr": 4.947735191637631e-06, "epoch": 0.5187368421052632, "percentage": 52.03, "elapsed_time": "7:05:09", "remaining_time": "6:32:01"} |
|
{"current_steps": 155, "total_steps": 296, "loss": 0.4819, "lr": 4.912891986062718e-06, "epoch": 0.5221052631578947, "percentage": 52.36, "elapsed_time": "7:06:48", "remaining_time": "6:28:15"} |
|
{"current_steps": 155, "total_steps": 296, "eval_loss": 0.4551759660243988, "epoch": 0.5221052631578947, "percentage": 52.36, "elapsed_time": "7:11:44", "remaining_time": "6:32:44"} |
|
{"current_steps": 156, "total_steps": 296, "loss": 0.4333, "lr": 4.8780487804878055e-06, "epoch": 0.5254736842105263, "percentage": 52.7, "elapsed_time": "7:13:26", "remaining_time": "6:28:59"} |
|
{"current_steps": 157, "total_steps": 296, "loss": 0.4343, "lr": 4.843205574912893e-06, "epoch": 0.5288421052631579, "percentage": 53.04, "elapsed_time": "7:15:13", "remaining_time": "6:25:19"} |
|
{"current_steps": 158, "total_steps": 296, "loss": 0.4909, "lr": 4.8083623693379794e-06, "epoch": 0.5322105263157895, "percentage": 53.38, "elapsed_time": "7:16:56", "remaining_time": "6:21:37"} |
|
{"current_steps": 159, "total_steps": 296, "loss": 0.444, "lr": 4.773519163763067e-06, "epoch": 0.535578947368421, "percentage": 53.72, "elapsed_time": "7:18:43", "remaining_time": "6:18:00"} |
|
{"current_steps": 160, "total_steps": 296, "loss": 0.4794, "lr": 4.738675958188153e-06, "epoch": 0.5389473684210526, "percentage": 54.05, "elapsed_time": "7:20:31", "remaining_time": "6:14:26"} |
|
{"current_steps": 160, "total_steps": 296, "eval_loss": 0.4603857398033142, "epoch": 0.5389473684210526, "percentage": 54.05, "elapsed_time": "7:25:27", "remaining_time": "6:18:38"} |
|
{"current_steps": 161, "total_steps": 296, "loss": 0.4511, "lr": 4.703832752613241e-06, "epoch": 0.5423157894736842, "percentage": 54.39, "elapsed_time": "7:27:21", "remaining_time": "6:15:06"} |
|
{"current_steps": 162, "total_steps": 296, "loss": 0.4495, "lr": 4.668989547038328e-06, "epoch": 0.5456842105263158, "percentage": 54.73, "elapsed_time": "7:29:07", "remaining_time": "6:11:30"} |
|
{"current_steps": 163, "total_steps": 296, "loss": 0.4634, "lr": 4.634146341463416e-06, "epoch": 0.5490526315789473, "percentage": 55.07, "elapsed_time": "7:30:57", "remaining_time": "6:07:57"} |
|
{"current_steps": 164, "total_steps": 296, "loss": 0.5176, "lr": 4.599303135888502e-06, "epoch": 0.5524210526315789, "percentage": 55.41, "elapsed_time": "7:32:43", "remaining_time": "6:04:22"} |
|
{"current_steps": 165, "total_steps": 296, "loss": 0.4272, "lr": 4.56445993031359e-06, "epoch": 0.5557894736842105, "percentage": 55.74, "elapsed_time": "7:34:34", "remaining_time": "6:00:54"} |
|
{"current_steps": 165, "total_steps": 296, "eval_loss": 0.4549420475959778, "epoch": 0.5557894736842105, "percentage": 55.74, "elapsed_time": "7:39:30", "remaining_time": "6:04:49"} |
|
{"current_steps": 166, "total_steps": 296, "loss": 0.4548, "lr": 4.529616724738676e-06, "epoch": 0.5591578947368421, "percentage": 56.08, "elapsed_time": "7:41:12", "remaining_time": "6:01:11"} |
|
{"current_steps": 167, "total_steps": 296, "loss": 0.5121, "lr": 4.4947735191637636e-06, "epoch": 0.5625263157894737, "percentage": 56.42, "elapsed_time": "7:42:58", "remaining_time": "5:57:37"} |
|
{"current_steps": 168, "total_steps": 296, "loss": 0.452, "lr": 4.45993031358885e-06, "epoch": 0.5658947368421052, "percentage": 56.76, "elapsed_time": "7:44:38", "remaining_time": "5:54:00"} |
|
{"current_steps": 169, "total_steps": 296, "loss": 0.4668, "lr": 4.4250871080139375e-06, "epoch": 0.5692631578947368, "percentage": 57.09, "elapsed_time": "7:46:18", "remaining_time": "5:50:25"} |
|
{"current_steps": 170, "total_steps": 296, "loss": 0.4615, "lr": 4.390243902439025e-06, "epoch": 0.5726315789473684, "percentage": 57.43, "elapsed_time": "7:47:57", "remaining_time": "5:46:50"} |
|
{"current_steps": 170, "total_steps": 296, "eval_loss": 0.45792800188064575, "epoch": 0.5726315789473684, "percentage": 57.43, "elapsed_time": "7:52:53", "remaining_time": "5:50:30"} |
|
{"current_steps": 171, "total_steps": 296, "loss": 0.4643, "lr": 4.3554006968641115e-06, "epoch": 0.576, "percentage": 57.77, "elapsed_time": "7:54:40", "remaining_time": "5:46:59"} |
|
{"current_steps": 172, "total_steps": 296, "loss": 0.4511, "lr": 4.320557491289199e-06, "epoch": 0.5793684210526315, "percentage": 58.11, "elapsed_time": "7:56:25", "remaining_time": "5:43:28"} |
|
{"current_steps": 173, "total_steps": 296, "loss": 0.4903, "lr": 4.2857142857142855e-06, "epoch": 0.5827368421052631, "percentage": 58.45, "elapsed_time": "7:58:08", "remaining_time": "5:39:57"} |
|
{"current_steps": 174, "total_steps": 296, "loss": 0.4845, "lr": 4.250871080139373e-06, "epoch": 0.5861052631578947, "percentage": 58.78, "elapsed_time": "7:59:48", "remaining_time": "5:36:24"} |
|
{"current_steps": 175, "total_steps": 296, "loss": 0.4417, "lr": 4.21602787456446e-06, "epoch": 0.5894736842105263, "percentage": 59.12, "elapsed_time": "8:01:29", "remaining_time": "5:32:55"} |
|
{"current_steps": 175, "total_steps": 296, "eval_loss": 0.4459608197212219, "epoch": 0.5894736842105263, "percentage": 59.12, "elapsed_time": "8:06:25", "remaining_time": "5:36:19"} |
|
{"current_steps": 176, "total_steps": 296, "loss": 0.4188, "lr": 4.181184668989548e-06, "epoch": 0.592842105263158, "percentage": 59.46, "elapsed_time": "8:08:07", "remaining_time": "5:32:48"} |
|
{"current_steps": 177, "total_steps": 296, "loss": 0.465, "lr": 4.146341463414634e-06, "epoch": 0.5962105263157895, "percentage": 59.8, "elapsed_time": "8:09:52", "remaining_time": "5:29:21"} |
|
{"current_steps": 178, "total_steps": 296, "loss": 0.4528, "lr": 4.111498257839722e-06, "epoch": 0.5995789473684211, "percentage": 60.14, "elapsed_time": "8:11:35", "remaining_time": "5:25:52"} |
|
{"current_steps": 179, "total_steps": 296, "loss": 0.4392, "lr": 4.076655052264808e-06, "epoch": 0.6029473684210527, "percentage": 60.47, "elapsed_time": "8:13:17", "remaining_time": "5:22:25"} |
|
{"current_steps": 180, "total_steps": 296, "loss": 0.4275, "lr": 4.041811846689896e-06, "epoch": 0.6063157894736843, "percentage": 60.81, "elapsed_time": "8:15:07", "remaining_time": "5:19:04"} |
|
{"current_steps": 180, "total_steps": 296, "eval_loss": 0.44529595971107483, "epoch": 0.6063157894736843, "percentage": 60.81, "elapsed_time": "8:20:03", "remaining_time": "5:22:15"} |
|
{"current_steps": 181, "total_steps": 296, "loss": 0.436, "lr": 4.006968641114983e-06, "epoch": 0.6096842105263158, "percentage": 61.15, "elapsed_time": "8:21:54", "remaining_time": "5:18:53"} |
|
{"current_steps": 182, "total_steps": 296, "loss": 0.4095, "lr": 3.97212543554007e-06, "epoch": 0.6130526315789474, "percentage": 61.49, "elapsed_time": "8:23:40", "remaining_time": "5:15:29"} |
|
{"current_steps": 183, "total_steps": 296, "loss": 0.4744, "lr": 3.937282229965157e-06, "epoch": 0.616421052631579, "percentage": 61.82, "elapsed_time": "8:25:25", "remaining_time": "5:12:05"} |
|
{"current_steps": 184, "total_steps": 296, "loss": 0.4601, "lr": 3.902439024390244e-06, "epoch": 0.6197894736842106, "percentage": 62.16, "elapsed_time": "8:27:09", "remaining_time": "5:08:42"} |
|
{"current_steps": 185, "total_steps": 296, "loss": 0.4303, "lr": 3.867595818815331e-06, "epoch": 0.6231578947368421, "percentage": 62.5, "elapsed_time": "8:28:52", "remaining_time": "5:05:19"} |
|
{"current_steps": 185, "total_steps": 296, "eval_loss": 0.44683924317359924, "epoch": 0.6231578947368421, "percentage": 62.5, "elapsed_time": "8:33:48", "remaining_time": "5:08:17"} |
|
{"current_steps": 186, "total_steps": 296, "loss": 0.3899, "lr": 3.832752613240418e-06, "epoch": 0.6265263157894737, "percentage": 62.84, "elapsed_time": "8:36:11", "remaining_time": "5:05:16"} |
|
{"current_steps": 187, "total_steps": 296, "loss": 0.4262, "lr": 3.7979094076655053e-06, "epoch": 0.6298947368421053, "percentage": 63.18, "elapsed_time": "8:38:52", "remaining_time": "5:02:26"} |
|
{"current_steps": 188, "total_steps": 296, "loss": 0.4317, "lr": 3.7630662020905927e-06, "epoch": 0.6332631578947369, "percentage": 63.51, "elapsed_time": "8:41:33", "remaining_time": "4:59:37"} |
|
{"current_steps": 189, "total_steps": 296, "loss": 0.4372, "lr": 3.7282229965156797e-06, "epoch": 0.6366315789473684, "percentage": 63.85, "elapsed_time": "8:44:09", "remaining_time": "4:56:44"} |
|
{"current_steps": 190, "total_steps": 296, "loss": 0.4286, "lr": 3.693379790940767e-06, "epoch": 0.64, "percentage": 64.19, "elapsed_time": "8:46:53", "remaining_time": "4:53:57"} |
|
{"current_steps": 190, "total_steps": 296, "eval_loss": 0.43968334794044495, "epoch": 0.64, "percentage": 64.19, "elapsed_time": "8:51:49", "remaining_time": "4:56:42"} |
|
{"current_steps": 191, "total_steps": 296, "loss": 0.4094, "lr": 3.6585365853658537e-06, "epoch": 0.6433684210526316, "percentage": 64.53, "elapsed_time": "8:54:05", "remaining_time": "4:53:36"} |
|
{"current_steps": 192, "total_steps": 296, "loss": 0.4906, "lr": 3.623693379790941e-06, "epoch": 0.6467368421052632, "percentage": 64.86, "elapsed_time": "8:56:11", "remaining_time": "4:50:26"} |
|
{"current_steps": 193, "total_steps": 296, "loss": 0.4557, "lr": 3.588850174216028e-06, "epoch": 0.6501052631578947, "percentage": 65.2, "elapsed_time": "8:58:23", "remaining_time": "4:47:19"} |
|
{"current_steps": 194, "total_steps": 296, "loss": 0.3978, "lr": 3.5540069686411155e-06, "epoch": 0.6534736842105263, "percentage": 65.54, "elapsed_time": "9:00:25", "remaining_time": "4:44:08"} |
|
{"current_steps": 195, "total_steps": 296, "loss": 0.4655, "lr": 3.5191637630662025e-06, "epoch": 0.6568421052631579, "percentage": 65.88, "elapsed_time": "9:02:25", "remaining_time": "4:40:56"} |
|
{"current_steps": 195, "total_steps": 296, "eval_loss": 0.4368743896484375, "epoch": 0.6568421052631579, "percentage": 65.88, "elapsed_time": "9:07:21", "remaining_time": "4:43:30"} |
|
{"current_steps": 196, "total_steps": 296, "loss": 0.4158, "lr": 3.48432055749129e-06, "epoch": 0.6602105263157895, "percentage": 66.22, "elapsed_time": "9:09:09", "remaining_time": "4:40:10"} |
|
{"current_steps": 197, "total_steps": 296, "loss": 0.4567, "lr": 3.4494773519163764e-06, "epoch": 0.663578947368421, "percentage": 66.55, "elapsed_time": "9:10:59", "remaining_time": "4:36:53"} |
|
{"current_steps": 198, "total_steps": 296, "loss": 0.3909, "lr": 3.414634146341464e-06, "epoch": 0.6669473684210526, "percentage": 66.89, "elapsed_time": "9:12:43", "remaining_time": "4:33:34"} |
|
{"current_steps": 199, "total_steps": 296, "loss": 0.4208, "lr": 3.379790940766551e-06, "epoch": 0.6703157894736842, "percentage": 67.23, "elapsed_time": "9:14:33", "remaining_time": "4:30:18"} |
|
{"current_steps": 200, "total_steps": 296, "loss": 0.386, "lr": 3.3449477351916382e-06, "epoch": 0.6736842105263158, "percentage": 67.57, "elapsed_time": "9:16:19", "remaining_time": "4:27:02"} |
|
{"current_steps": 200, "total_steps": 296, "eval_loss": 0.44159650802612305, "epoch": 0.6736842105263158, "percentage": 67.57, "elapsed_time": "9:21:15", "remaining_time": "4:29:24"} |
|
{"current_steps": 201, "total_steps": 296, "loss": 0.4443, "lr": 3.310104529616725e-06, "epoch": 0.6770526315789474, "percentage": 67.91, "elapsed_time": "9:23:04", "remaining_time": "4:26:08"} |
|
{"current_steps": 202, "total_steps": 296, "loss": 0.4267, "lr": 3.2752613240418118e-06, "epoch": 0.6804210526315789, "percentage": 68.24, "elapsed_time": "9:24:53", "remaining_time": "4:22:52"} |
|
{"current_steps": 203, "total_steps": 296, "loss": 0.4117, "lr": 3.240418118466899e-06, "epoch": 0.6837894736842105, "percentage": 68.58, "elapsed_time": "9:26:42", "remaining_time": "4:19:37"} |
|
{"current_steps": 204, "total_steps": 296, "loss": 0.4249, "lr": 3.205574912891986e-06, "epoch": 0.6871578947368421, "percentage": 68.92, "elapsed_time": "9:28:29", "remaining_time": "4:16:22"} |
|
{"current_steps": 205, "total_steps": 296, "loss": 0.4129, "lr": 3.1707317073170736e-06, "epoch": 0.6905263157894737, "percentage": 69.26, "elapsed_time": "9:30:13", "remaining_time": "4:13:07"} |
|
{"current_steps": 205, "total_steps": 296, "eval_loss": 0.4336434602737427, "epoch": 0.6905263157894737, "percentage": 69.26, "elapsed_time": "9:35:09", "remaining_time": "4:15:18"} |
|
{"current_steps": 206, "total_steps": 296, "loss": 0.405, "lr": 3.13588850174216e-06, "epoch": 0.6938947368421052, "percentage": 69.59, "elapsed_time": "9:37:05", "remaining_time": "4:12:07"} |
|
{"current_steps": 207, "total_steps": 296, "loss": 0.4217, "lr": 3.1010452961672475e-06, "epoch": 0.6972631578947368, "percentage": 69.93, "elapsed_time": "9:38:54", "remaining_time": "4:08:54"} |
|
{"current_steps": 208, "total_steps": 296, "loss": 0.4415, "lr": 3.0662020905923345e-06, "epoch": 0.7006315789473684, "percentage": 70.27, "elapsed_time": "9:40:44", "remaining_time": "4:05:41"} |
|
{"current_steps": 209, "total_steps": 296, "loss": 0.44, "lr": 3.031358885017422e-06, "epoch": 0.704, "percentage": 70.61, "elapsed_time": "9:42:35", "remaining_time": "4:02:30"} |
|
{"current_steps": 210, "total_steps": 296, "loss": 0.3851, "lr": 2.996515679442509e-06, "epoch": 0.7073684210526315, "percentage": 70.95, "elapsed_time": "9:44:27", "remaining_time": "3:59:21"} |
|
{"current_steps": 210, "total_steps": 296, "eval_loss": 0.4335211217403412, "epoch": 0.7073684210526315, "percentage": 70.95, "elapsed_time": "9:49:23", "remaining_time": "4:01:22"} |
|
{"current_steps": 211, "total_steps": 296, "loss": 0.4541, "lr": 2.9616724738675963e-06, "epoch": 0.7107368421052631, "percentage": 71.28, "elapsed_time": "9:51:12", "remaining_time": "3:58:09"} |
|
{"current_steps": 212, "total_steps": 296, "loss": 0.4251, "lr": 2.926829268292683e-06, "epoch": 0.7141052631578947, "percentage": 71.62, "elapsed_time": "9:53:04", "remaining_time": "3:54:59"} |
|
{"current_steps": 213, "total_steps": 296, "loss": 0.4162, "lr": 2.8919860627177703e-06, "epoch": 0.7174736842105263, "percentage": 71.96, "elapsed_time": "9:54:52", "remaining_time": "3:51:48"} |
|
{"current_steps": 214, "total_steps": 296, "loss": 0.4213, "lr": 2.8571428571428573e-06, "epoch": 0.7208421052631578, "percentage": 72.3, "elapsed_time": "9:56:50", "remaining_time": "3:48:41"} |
|
{"current_steps": 215, "total_steps": 296, "loss": 0.4516, "lr": 2.8222996515679447e-06, "epoch": 0.7242105263157895, "percentage": 72.64, "elapsed_time": "9:58:38", "remaining_time": "3:45:31"} |
|
{"current_steps": 215, "total_steps": 296, "eval_loss": 0.43385687470436096, "epoch": 0.7242105263157895, "percentage": 72.64, "elapsed_time": "10:03:34", "remaining_time": "3:47:23"} |
|
{"current_steps": 216, "total_steps": 296, "loss": 0.4376, "lr": 2.7874564459930316e-06, "epoch": 0.7275789473684211, "percentage": 72.97, "elapsed_time": "10:05:34", "remaining_time": "3:44:17"} |
|
{"current_steps": 217, "total_steps": 296, "loss": 0.4485, "lr": 2.7526132404181186e-06, "epoch": 0.7309473684210527, "percentage": 73.31, "elapsed_time": "10:07:32", "remaining_time": "3:41:10"} |
|
{"current_steps": 218, "total_steps": 296, "loss": 0.4537, "lr": 2.7177700348432056e-06, "epoch": 0.7343157894736843, "percentage": 73.65, "elapsed_time": "10:09:28", "remaining_time": "3:38:04"} |
|
{"current_steps": 219, "total_steps": 296, "loss": 0.4366, "lr": 2.682926829268293e-06, "epoch": 0.7376842105263158, "percentage": 73.99, "elapsed_time": "10:11:25", "remaining_time": "3:34:58"} |
|
{"current_steps": 220, "total_steps": 296, "loss": 0.3995, "lr": 2.64808362369338e-06, "epoch": 0.7410526315789474, "percentage": 74.32, "elapsed_time": "10:13:24", "remaining_time": "3:31:54"} |
|
{"current_steps": 220, "total_steps": 296, "eval_loss": 0.43131592869758606, "epoch": 0.7410526315789474, "percentage": 74.32, "elapsed_time": "10:18:20", "remaining_time": "3:33:36"} |
|
{"current_steps": 221, "total_steps": 296, "loss": 0.3878, "lr": 2.6132404181184674e-06, "epoch": 0.744421052631579, "percentage": 74.66, "elapsed_time": "10:20:14", "remaining_time": "3:30:29"} |
|
{"current_steps": 222, "total_steps": 296, "loss": 0.4301, "lr": 2.578397212543554e-06, "epoch": 0.7477894736842106, "percentage": 75.0, "elapsed_time": "10:22:05", "remaining_time": "3:27:21"} |
|
{"current_steps": 223, "total_steps": 296, "loss": 0.404, "lr": 2.5435540069686414e-06, "epoch": 0.7511578947368421, "percentage": 75.34, "elapsed_time": "10:24:08", "remaining_time": "3:24:18"} |
|
{"current_steps": 224, "total_steps": 296, "loss": 0.4433, "lr": 2.5087108013937284e-06, "epoch": 0.7545263157894737, "percentage": 75.68, "elapsed_time": "10:26:04", "remaining_time": "3:21:14"} |
|
{"current_steps": 225, "total_steps": 296, "loss": 0.3488, "lr": 2.4738675958188153e-06, "epoch": 0.7578947368421053, "percentage": 76.01, "elapsed_time": "10:28:00", "remaining_time": "3:18:10"} |
|
{"current_steps": 225, "total_steps": 296, "eval_loss": 0.432211309671402, "epoch": 0.7578947368421053, "percentage": 76.01, "elapsed_time": "10:32:56", "remaining_time": "3:19:43"} |
|
{"current_steps": 226, "total_steps": 296, "loss": 0.4401, "lr": 2.4390243902439027e-06, "epoch": 0.7612631578947369, "percentage": 76.35, "elapsed_time": "10:34:48", "remaining_time": "3:16:37"} |
|
{"current_steps": 227, "total_steps": 296, "loss": 0.4097, "lr": 2.4041811846689897e-06, "epoch": 0.7646315789473684, "percentage": 76.69, "elapsed_time": "10:36:40", "remaining_time": "3:13:31"} |
|
{"current_steps": 228, "total_steps": 296, "loss": 0.4486, "lr": 2.3693379790940767e-06, "epoch": 0.768, "percentage": 77.03, "elapsed_time": "10:38:29", "remaining_time": "3:10:25"} |
|
{"current_steps": 229, "total_steps": 296, "loss": 0.3738, "lr": 2.334494773519164e-06, "epoch": 0.7713684210526316, "percentage": 77.36, "elapsed_time": "10:40:25", "remaining_time": "3:07:22"} |
|
{"current_steps": 230, "total_steps": 296, "loss": 0.4874, "lr": 2.299651567944251e-06, "epoch": 0.7747368421052632, "percentage": 77.7, "elapsed_time": "10:42:19", "remaining_time": "3:04:19"} |
|
{"current_steps": 230, "total_steps": 296, "eval_loss": 0.4298974871635437, "epoch": 0.7747368421052632, "percentage": 77.7, "elapsed_time": "10:47:15", "remaining_time": "3:05:44"} |
|
{"current_steps": 231, "total_steps": 296, "loss": 0.4251, "lr": 2.264808362369338e-06, "epoch": 0.7781052631578947, "percentage": 78.04, "elapsed_time": "10:49:29", "remaining_time": "3:02:45"} |
|
{"current_steps": 232, "total_steps": 296, "loss": 0.4927, "lr": 2.229965156794425e-06, "epoch": 0.7814736842105263, "percentage": 78.38, "elapsed_time": "10:51:35", "remaining_time": "2:59:45"} |
|
{"current_steps": 233, "total_steps": 296, "loss": 0.4914, "lr": 2.1951219512195125e-06, "epoch": 0.7848421052631579, "percentage": 78.72, "elapsed_time": "10:53:35", "remaining_time": "2:56:43"} |
|
{"current_steps": 234, "total_steps": 296, "loss": 0.409, "lr": 2.1602787456445995e-06, "epoch": 0.7882105263157895, "percentage": 79.05, "elapsed_time": "10:55:30", "remaining_time": "2:53:40"} |
|
{"current_steps": 235, "total_steps": 296, "loss": 0.4217, "lr": 2.1254355400696864e-06, "epoch": 0.791578947368421, "percentage": 79.39, "elapsed_time": "10:57:21", "remaining_time": "2:50:37"} |
|
{"current_steps": 235, "total_steps": 296, "eval_loss": 0.4288136661052704, "epoch": 0.791578947368421, "percentage": 79.39, "elapsed_time": "11:02:17", "remaining_time": "2:51:54"} |
|
{"current_steps": 236, "total_steps": 296, "loss": 0.4629, "lr": 2.090592334494774e-06, "epoch": 0.7949473684210526, "percentage": 79.73, "elapsed_time": "11:04:15", "remaining_time": "2:48:52"} |
|
{"current_steps": 237, "total_steps": 296, "loss": 0.4349, "lr": 2.055749128919861e-06, "epoch": 0.7983157894736842, "percentage": 80.07, "elapsed_time": "11:06:07", "remaining_time": "2:45:49"} |
|
{"current_steps": 238, "total_steps": 296, "loss": 0.4051, "lr": 2.020905923344948e-06, "epoch": 0.8016842105263158, "percentage": 80.41, "elapsed_time": "11:07:59", "remaining_time": "2:42:47"} |
|
{"current_steps": 239, "total_steps": 296, "loss": 0.4662, "lr": 1.986062717770035e-06, "epoch": 0.8050526315789474, "percentage": 80.74, "elapsed_time": "11:09:51", "remaining_time": "2:39:45"} |
|
{"current_steps": 240, "total_steps": 296, "loss": 0.4295, "lr": 1.951219512195122e-06, "epoch": 0.8084210526315789, "percentage": 81.08, "elapsed_time": "11:11:50", "remaining_time": "2:36:45"} |
|
{"current_steps": 240, "total_steps": 296, "eval_loss": 0.4299337863922119, "epoch": 0.8084210526315789, "percentage": 81.08, "elapsed_time": "11:16:46", "remaining_time": "2:37:54"} |
|
{"current_steps": 241, "total_steps": 296, "loss": 0.4544, "lr": 1.916376306620209e-06, "epoch": 0.8117894736842105, "percentage": 81.42, "elapsed_time": "11:18:46", "remaining_time": "2:34:54"} |
|
{"current_steps": 242, "total_steps": 296, "loss": 0.4071, "lr": 1.8815331010452964e-06, "epoch": 0.8151578947368421, "percentage": 81.76, "elapsed_time": "11:20:41", "remaining_time": "2:31:53"} |
|
{"current_steps": 243, "total_steps": 296, "loss": 0.4536, "lr": 1.8466898954703836e-06, "epoch": 0.8185263157894737, "percentage": 82.09, "elapsed_time": "11:22:38", "remaining_time": "2:28:53"} |
|
{"current_steps": 244, "total_steps": 296, "loss": 0.4182, "lr": 1.8118466898954705e-06, "epoch": 0.8218947368421052, "percentage": 82.43, "elapsed_time": "11:24:40", "remaining_time": "2:25:54"} |
|
{"current_steps": 245, "total_steps": 296, "loss": 0.4777, "lr": 1.7770034843205577e-06, "epoch": 0.8252631578947368, "percentage": 82.77, "elapsed_time": "11:26:37", "remaining_time": "2:22:55"} |
|
{"current_steps": 245, "total_steps": 296, "eval_loss": 0.43184179067611694, "epoch": 0.8252631578947368, "percentage": 82.77, "elapsed_time": "11:31:33", "remaining_time": "2:23:57"} |
|
{"current_steps": 246, "total_steps": 296, "loss": 0.4165, "lr": 1.742160278745645e-06, "epoch": 0.8286315789473684, "percentage": 83.11, "elapsed_time": "11:33:16", "remaining_time": "2:20:54"} |
|
{"current_steps": 247, "total_steps": 296, "loss": 0.3889, "lr": 1.707317073170732e-06, "epoch": 0.832, "percentage": 83.45, "elapsed_time": "11:35:00", "remaining_time": "2:17:52"} |
|
{"current_steps": 248, "total_steps": 296, "loss": 0.4439, "lr": 1.6724738675958191e-06, "epoch": 0.8353684210526315, "percentage": 83.78, "elapsed_time": "11:36:49", "remaining_time": "2:14:52"} |
|
{"current_steps": 249, "total_steps": 296, "loss": 0.4939, "lr": 1.6376306620209059e-06, "epoch": 0.8387368421052631, "percentage": 84.12, "elapsed_time": "11:38:46", "remaining_time": "2:11:53"} |
|
{"current_steps": 250, "total_steps": 296, "loss": 0.4612, "lr": 1.602787456445993e-06, "epoch": 0.8421052631578947, "percentage": 84.46, "elapsed_time": "11:40:34", "remaining_time": "2:08:54"} |
|
{"current_steps": 250, "total_steps": 296, "eval_loss": 0.42705872654914856, "epoch": 0.8421052631578947, "percentage": 84.46, "elapsed_time": "11:45:29", "remaining_time": "2:09:48"} |
|
{"current_steps": 251, "total_steps": 296, "loss": 0.401, "lr": 1.56794425087108e-06, "epoch": 0.8454736842105263, "percentage": 84.8, "elapsed_time": "11:47:18", "remaining_time": "2:06:48"} |
|
{"current_steps": 252, "total_steps": 296, "loss": 0.4141, "lr": 1.5331010452961673e-06, "epoch": 0.8488421052631578, "percentage": 85.14, "elapsed_time": "11:49:07", "remaining_time": "2:03:48"} |
|
{"current_steps": 253, "total_steps": 296, "loss": 0.3961, "lr": 1.4982578397212545e-06, "epoch": 0.8522105263157894, "percentage": 85.47, "elapsed_time": "11:51:03", "remaining_time": "2:00:51"} |
|
{"current_steps": 254, "total_steps": 296, "loss": 0.3972, "lr": 1.4634146341463414e-06, "epoch": 0.8555789473684211, "percentage": 85.81, "elapsed_time": "11:52:57", "remaining_time": "1:57:53"} |
|
{"current_steps": 255, "total_steps": 296, "loss": 0.4576, "lr": 1.4285714285714286e-06, "epoch": 0.8589473684210527, "percentage": 86.15, "elapsed_time": "11:54:54", "remaining_time": "1:54:56"} |
|
{"current_steps": 255, "total_steps": 296, "eval_loss": 0.43086671829223633, "epoch": 0.8589473684210527, "percentage": 86.15, "elapsed_time": "11:59:50", "remaining_time": "1:55:44"} |
|
{"current_steps": 256, "total_steps": 296, "loss": 0.4499, "lr": 1.3937282229965158e-06, "epoch": 0.8623157894736843, "percentage": 86.49, "elapsed_time": "12:01:41", "remaining_time": "1:52:45"} |
|
{"current_steps": 257, "total_steps": 296, "loss": 0.4615, "lr": 1.3588850174216028e-06, "epoch": 0.8656842105263158, "percentage": 86.82, "elapsed_time": "12:03:30", "remaining_time": "1:49:47"} |
|
{"current_steps": 258, "total_steps": 296, "loss": 0.4738, "lr": 1.32404181184669e-06, "epoch": 0.8690526315789474, "percentage": 87.16, "elapsed_time": "12:05:16", "remaining_time": "1:46:49"} |
|
{"current_steps": 259, "total_steps": 296, "loss": 0.4119, "lr": 1.289198606271777e-06, "epoch": 0.872421052631579, "percentage": 87.5, "elapsed_time": "12:07:01", "remaining_time": "1:43:51"} |
|
{"current_steps": 260, "total_steps": 296, "loss": 0.3921, "lr": 1.2543554006968642e-06, "epoch": 0.8757894736842106, "percentage": 87.84, "elapsed_time": "12:08:45", "remaining_time": "1:40:54"} |
|
{"current_steps": 260, "total_steps": 296, "eval_loss": 0.43330395221710205, "epoch": 0.8757894736842106, "percentage": 87.84, "elapsed_time": "12:13:42", "remaining_time": "1:41:35"} |
|
{"current_steps": 261, "total_steps": 296, "loss": 0.4041, "lr": 1.2195121951219514e-06, "epoch": 0.8791578947368421, "percentage": 88.18, "elapsed_time": "12:15:25", "remaining_time": "1:38:37"} |
|
{"current_steps": 262, "total_steps": 296, "loss": 0.4859, "lr": 1.1846689895470384e-06, "epoch": 0.8825263157894737, "percentage": 88.51, "elapsed_time": "12:17:08", "remaining_time": "1:35:39"} |
|
{"current_steps": 263, "total_steps": 296, "loss": 0.4067, "lr": 1.1498257839721255e-06, "epoch": 0.8858947368421053, "percentage": 88.85, "elapsed_time": "12:18:49", "remaining_time": "1:32:42"} |
|
{"current_steps": 264, "total_steps": 296, "loss": 0.4321, "lr": 1.1149825783972125e-06, "epoch": 0.8892631578947369, "percentage": 89.19, "elapsed_time": "12:20:28", "remaining_time": "1:29:45"} |
|
{"current_steps": 265, "total_steps": 296, "loss": 0.4372, "lr": 1.0801393728222997e-06, "epoch": 0.8926315789473684, "percentage": 89.53, "elapsed_time": "12:22:08", "remaining_time": "1:26:48"} |
|
{"current_steps": 265, "total_steps": 296, "eval_loss": 0.43019115924835205, "epoch": 0.8926315789473684, "percentage": 89.53, "elapsed_time": "12:27:04", "remaining_time": "1:27:23"} |
|
{"current_steps": 266, "total_steps": 296, "loss": 0.4521, "lr": 1.045296167247387e-06, "epoch": 0.896, "percentage": 89.86, "elapsed_time": "12:28:54", "remaining_time": "1:24:27"} |
|
{"current_steps": 267, "total_steps": 296, "loss": 0.4406, "lr": 1.010452961672474e-06, "epoch": 0.8993684210526316, "percentage": 90.2, "elapsed_time": "12:30:46", "remaining_time": "1:21:32"} |
|
{"current_steps": 268, "total_steps": 296, "loss": 0.4209, "lr": 9.75609756097561e-07, "epoch": 0.9027368421052632, "percentage": 90.54, "elapsed_time": "12:32:40", "remaining_time": "1:18:38"} |
|
{"current_steps": 269, "total_steps": 296, "loss": 0.4, "lr": 9.407665505226482e-07, "epoch": 0.9061052631578947, "percentage": 90.88, "elapsed_time": "12:34:30", "remaining_time": "1:15:43"} |
|
{"current_steps": 270, "total_steps": 296, "loss": 0.5449, "lr": 9.059233449477353e-07, "epoch": 0.9094736842105263, "percentage": 91.22, "elapsed_time": "12:36:18", "remaining_time": "1:12:49"} |
|
{"current_steps": 270, "total_steps": 296, "eval_loss": 0.43349674344062805, "epoch": 0.9094736842105263, "percentage": 91.22, "elapsed_time": "12:41:14", "remaining_time": "1:13:18"} |
|
{"current_steps": 271, "total_steps": 296, "loss": 0.3771, "lr": 8.710801393728225e-07, "epoch": 0.9128421052631579, "percentage": 91.55, "elapsed_time": "12:43:01", "remaining_time": "1:10:23"} |
|
{"current_steps": 272, "total_steps": 296, "loss": 0.4439, "lr": 8.362369337979096e-07, "epoch": 0.9162105263157895, "percentage": 91.89, "elapsed_time": "12:44:48", "remaining_time": "1:07:28"} |
|
{"current_steps": 273, "total_steps": 296, "loss": 0.4017, "lr": 8.013937282229965e-07, "epoch": 0.919578947368421, "percentage": 92.23, "elapsed_time": "12:46:36", "remaining_time": "1:04:35"} |
|
{"current_steps": 274, "total_steps": 296, "loss": 0.397, "lr": 7.665505226480836e-07, "epoch": 0.9229473684210526, "percentage": 92.57, "elapsed_time": "12:48:22", "remaining_time": "1:01:41"} |
|
{"current_steps": 275, "total_steps": 296, "loss": 0.4428, "lr": 7.317073170731707e-07, "epoch": 0.9263157894736842, "percentage": 92.91, "elapsed_time": "12:50:15", "remaining_time": "0:58:49"} |
|
{"current_steps": 275, "total_steps": 296, "eval_loss": 0.4311296343803406, "epoch": 0.9263157894736842, "percentage": 92.91, "elapsed_time": "12:55:11", "remaining_time": "0:59:11"} |
|
{"current_steps": 276, "total_steps": 296, "loss": 0.4267, "lr": 6.968641114982579e-07, "epoch": 0.9296842105263158, "percentage": 93.24, "elapsed_time": "12:56:58", "remaining_time": "0:56:18"} |
|
{"current_steps": 277, "total_steps": 296, "loss": 0.4095, "lr": 6.62020905923345e-07, "epoch": 0.9330526315789474, "percentage": 93.58, "elapsed_time": "12:58:43", "remaining_time": "0:53:24"} |
|
{"current_steps": 278, "total_steps": 296, "loss": 0.4512, "lr": 6.271777003484321e-07, "epoch": 0.9364210526315789, "percentage": 93.92, "elapsed_time": "13:00:27", "remaining_time": "0:50:32"} |
|
{"current_steps": 279, "total_steps": 296, "loss": 0.4369, "lr": 5.923344947735192e-07, "epoch": 0.9397894736842105, "percentage": 94.26, "elapsed_time": "13:02:12", "remaining_time": "0:47:39"} |
|
{"current_steps": 280, "total_steps": 296, "loss": 0.4395, "lr": 5.574912891986063e-07, "epoch": 0.9431578947368421, "percentage": 94.59, "elapsed_time": "13:04:01", "remaining_time": "0:44:48"} |
|
{"current_steps": 280, "total_steps": 296, "eval_loss": 0.42866575717926025, "epoch": 0.9431578947368421, "percentage": 94.59, "elapsed_time": "13:08:57", "remaining_time": "0:45:04"} |
|
{"current_steps": 281, "total_steps": 296, "loss": 0.4034, "lr": 5.226480836236935e-07, "epoch": 0.9465263157894737, "percentage": 94.93, "elapsed_time": "13:10:48", "remaining_time": "0:42:12"} |
|
{"current_steps": 282, "total_steps": 296, "loss": 0.4161, "lr": 4.878048780487805e-07, "epoch": 0.9498947368421052, "percentage": 95.27, "elapsed_time": "13:12:34", "remaining_time": "0:39:20"} |
|
{"current_steps": 283, "total_steps": 296, "loss": 0.4248, "lr": 4.5296167247386764e-07, "epoch": 0.9532631578947368, "percentage": 95.61, "elapsed_time": "13:14:15", "remaining_time": "0:36:29"} |
|
{"current_steps": 284, "total_steps": 296, "loss": 0.4205, "lr": 4.181184668989548e-07, "epoch": 0.9566315789473684, "percentage": 95.95, "elapsed_time": "13:16:01", "remaining_time": "0:33:38"} |
|
{"current_steps": 285, "total_steps": 296, "loss": 0.4674, "lr": 3.832752613240418e-07, "epoch": 0.96, "percentage": 96.28, "elapsed_time": "13:17:53", "remaining_time": "0:30:47"} |
|
{"current_steps": 285, "total_steps": 296, "eval_loss": 0.42619824409484863, "epoch": 0.96, "percentage": 96.28, "elapsed_time": "13:22:49", "remaining_time": "0:30:59"} |
|
{"current_steps": 286, "total_steps": 296, "loss": 0.4119, "lr": 3.4843205574912896e-07, "epoch": 0.9633684210526315, "percentage": 96.62, "elapsed_time": "13:24:36", "remaining_time": "0:28:07"} |
|
{"current_steps": 287, "total_steps": 296, "loss": 0.3907, "lr": 3.1358885017421604e-07, "epoch": 0.9667368421052631, "percentage": 96.96, "elapsed_time": "13:26:25", "remaining_time": "0:25:17"} |
|
{"current_steps": 288, "total_steps": 296, "loss": 0.4399, "lr": 2.7874564459930313e-07, "epoch": 0.9701052631578947, "percentage": 97.3, "elapsed_time": "13:28:16", "remaining_time": "0:22:27"} |
|
{"current_steps": 289, "total_steps": 296, "loss": 0.4154, "lr": 2.439024390243903e-07, "epoch": 0.9734736842105263, "percentage": 97.64, "elapsed_time": "13:30:06", "remaining_time": "0:19:37"} |
|
{"current_steps": 290, "total_steps": 296, "loss": 0.4225, "lr": 2.090592334494774e-07, "epoch": 0.9768421052631578, "percentage": 97.97, "elapsed_time": "13:32:00", "remaining_time": "0:16:48"} |
|
{"current_steps": 290, "total_steps": 296, "eval_loss": 0.42567482590675354, "epoch": 0.9768421052631578, "percentage": 97.97, "elapsed_time": "13:36:56", "remaining_time": "0:16:54"} |
|
{"current_steps": 291, "total_steps": 296, "loss": 0.4121, "lr": 1.7421602787456448e-07, "epoch": 0.9802105263157894, "percentage": 98.31, "elapsed_time": "13:38:45", "remaining_time": "0:14:04"} |
|
{"current_steps": 292, "total_steps": 296, "loss": 0.3721, "lr": 1.3937282229965157e-07, "epoch": 0.983578947368421, "percentage": 98.65, "elapsed_time": "13:40:35", "remaining_time": "0:11:14"} |
|
{"current_steps": 293, "total_steps": 296, "loss": 0.4255, "lr": 1.045296167247387e-07, "epoch": 0.9869473684210527, "percentage": 98.99, "elapsed_time": "13:42:23", "remaining_time": "0:08:25"} |
|
{"current_steps": 294, "total_steps": 296, "loss": 0.3859, "lr": 6.968641114982578e-08, "epoch": 0.9903157894736843, "percentage": 99.32, "elapsed_time": "13:44:12", "remaining_time": "0:05:36"} |
|
{"current_steps": 295, "total_steps": 296, "loss": 0.4262, "lr": 3.484320557491289e-08, "epoch": 0.9936842105263158, "percentage": 99.66, "elapsed_time": "13:46:01", "remaining_time": "0:02:48"} |
|
{"current_steps": 295, "total_steps": 296, "eval_loss": 0.4257739186286926, "epoch": 0.9936842105263158, "percentage": 99.66, "elapsed_time": "13:50:57", "remaining_time": "0:02:49"} |
|
{"current_steps": 296, "total_steps": 296, "loss": 0.5187, "lr": 0.0, "epoch": 0.9970526315789474, "percentage": 100.0, "elapsed_time": "13:52:43", "remaining_time": "0:00:00"} |
|
{"current_steps": 296, "total_steps": 296, "epoch": 0.9970526315789474, "percentage": 100.0, "elapsed_time": "13:54:21", "remaining_time": "0:00:00"} |
|
|