PumeTu's picture
Add files using upload-large-folder tool
d1e982f verified
{"current_steps": 1, "total_steps": 132, "loss": 0.9434, "lr": 0.0, "epoch": 0.022988505747126436, "percentage": 0.76, "elapsed_time": "0:03:36", "remaining_time": "7:52:42"}
{"current_steps": 2, "total_steps": 132, "loss": 0.9432, "lr": 1.4285714285714285e-05, "epoch": 0.04597701149425287, "percentage": 1.52, "elapsed_time": "0:07:03", "remaining_time": "7:38:49"}
{"current_steps": 3, "total_steps": 132, "loss": 0.9587, "lr": 2.857142857142857e-05, "epoch": 0.06896551724137931, "percentage": 2.27, "elapsed_time": "0:10:29", "remaining_time": "7:31:29"}
{"current_steps": 4, "total_steps": 132, "loss": 0.9314, "lr": 4.2857142857142856e-05, "epoch": 0.09195402298850575, "percentage": 3.03, "elapsed_time": "0:13:54", "remaining_time": "7:25:03"}
{"current_steps": 5, "total_steps": 132, "loss": 0.921, "lr": 5.714285714285714e-05, "epoch": 0.11494252873563218, "percentage": 3.79, "elapsed_time": "0:17:19", "remaining_time": "7:19:57"}
{"current_steps": 6, "total_steps": 132, "loss": 0.9226, "lr": 7.142857142857143e-05, "epoch": 0.13793103448275862, "percentage": 4.55, "elapsed_time": "0:20:42", "remaining_time": "7:15:00"}
{"current_steps": 7, "total_steps": 132, "loss": 0.9143, "lr": 8.571428571428571e-05, "epoch": 0.16091954022988506, "percentage": 5.3, "elapsed_time": "0:24:08", "remaining_time": "7:11:14"}
{"current_steps": 8, "total_steps": 132, "loss": 0.9042, "lr": 0.0001, "epoch": 0.1839080459770115, "percentage": 6.06, "elapsed_time": "0:27:32", "remaining_time": "7:06:58"}
{"current_steps": 9, "total_steps": 132, "loss": 0.9103, "lr": 0.00011428571428571428, "epoch": 0.20689655172413793, "percentage": 6.82, "elapsed_time": "0:31:00", "remaining_time": "7:03:42"}
{"current_steps": 10, "total_steps": 132, "loss": 0.8865, "lr": 0.00012857142857142858, "epoch": 0.22988505747126436, "percentage": 7.58, "elapsed_time": "0:34:25", "remaining_time": "6:59:59"}
{"current_steps": 10, "total_steps": 132, "eval_loss": 1.0120309591293335, "epoch": 0.22988505747126436, "percentage": 7.58, "elapsed_time": "0:39:32", "remaining_time": "8:02:21"}
{"current_steps": 11, "total_steps": 132, "loss": 0.8673, "lr": 0.00014285714285714287, "epoch": 0.25287356321839083, "percentage": 8.33, "elapsed_time": "0:42:59", "remaining_time": "7:52:51"}
{"current_steps": 12, "total_steps": 132, "loss": 0.8573, "lr": 0.00015714285714285716, "epoch": 0.27586206896551724, "percentage": 9.09, "elapsed_time": "0:46:24", "remaining_time": "7:44:04"}
{"current_steps": 13, "total_steps": 132, "loss": 0.8505, "lr": 0.00017142857142857143, "epoch": 0.2988505747126437, "percentage": 9.85, "elapsed_time": "0:49:49", "remaining_time": "7:36:05"}
{"current_steps": 14, "total_steps": 132, "loss": 0.8385, "lr": 0.00018571428571428572, "epoch": 0.3218390804597701, "percentage": 10.61, "elapsed_time": "0:53:14", "remaining_time": "7:28:44"}
{"current_steps": 15, "total_steps": 132, "loss": 0.8163, "lr": 0.0002, "epoch": 0.3448275862068966, "percentage": 11.36, "elapsed_time": "0:56:39", "remaining_time": "7:21:59"}
{"current_steps": 16, "total_steps": 132, "loss": 0.7976, "lr": 0.00019996456111234527, "epoch": 0.367816091954023, "percentage": 12.12, "elapsed_time": "1:00:03", "remaining_time": "7:15:22"}
{"current_steps": 17, "total_steps": 132, "loss": 0.805, "lr": 0.0001998582695676762, "epoch": 0.39080459770114945, "percentage": 12.88, "elapsed_time": "1:03:26", "remaining_time": "7:09:11"}
{"current_steps": 18, "total_steps": 132, "loss": 0.7909, "lr": 0.000199681200703075, "epoch": 0.41379310344827586, "percentage": 13.64, "elapsed_time": "1:06:52", "remaining_time": "7:03:30"}
{"current_steps": 19, "total_steps": 132, "loss": 0.7971, "lr": 0.00019943348002101371, "epoch": 0.4367816091954023, "percentage": 14.39, "elapsed_time": "1:10:17", "remaining_time": "6:58:04"}
{"current_steps": 20, "total_steps": 132, "loss": 0.7698, "lr": 0.00019911528310040074, "epoch": 0.45977011494252873, "percentage": 15.15, "elapsed_time": "1:13:43", "remaining_time": "6:52:50"}
{"current_steps": 20, "total_steps": 132, "eval_loss": 0.8262545466423035, "epoch": 0.45977011494252873, "percentage": 15.15, "elapsed_time": "1:18:47", "remaining_time": "7:21:14"}
{"current_steps": 21, "total_steps": 132, "loss": 0.7775, "lr": 0.00019872683547213446, "epoch": 0.4827586206896552, "percentage": 15.91, "elapsed_time": "1:22:12", "remaining_time": "7:14:32"}
{"current_steps": 22, "total_steps": 132, "loss": 0.7671, "lr": 0.00019826841245925212, "epoch": 0.5057471264367817, "percentage": 16.67, "elapsed_time": "1:25:37", "remaining_time": "7:08:09"}
{"current_steps": 23, "total_steps": 132, "loss": 0.7575, "lr": 0.00019774033898178667, "epoch": 0.5287356321839081, "percentage": 17.42, "elapsed_time": "1:29:01", "remaining_time": "7:01:55"}
{"current_steps": 24, "total_steps": 132, "loss": 0.7454, "lr": 0.00019714298932647098, "epoch": 0.5517241379310345, "percentage": 18.18, "elapsed_time": "1:32:24", "remaining_time": "6:55:51"}
{"current_steps": 25, "total_steps": 132, "loss": 0.7456, "lr": 0.0001964767868814516, "epoch": 0.5747126436781609, "percentage": 18.94, "elapsed_time": "1:35:48", "remaining_time": "6:50:03"}
{"current_steps": 26, "total_steps": 132, "loss": 0.7314, "lr": 0.00019574220383620055, "epoch": 0.5977011494252874, "percentage": 19.7, "elapsed_time": "1:39:12", "remaining_time": "6:44:27"}
{"current_steps": 27, "total_steps": 132, "loss": 0.7148, "lr": 0.00019493976084683813, "epoch": 0.6206896551724138, "percentage": 20.45, "elapsed_time": "1:42:36", "remaining_time": "6:39:00"}
{"current_steps": 28, "total_steps": 132, "loss": 0.7409, "lr": 0.00019407002666710336, "epoch": 0.6436781609195402, "percentage": 21.21, "elapsed_time": "1:45:59", "remaining_time": "6:33:41"}
{"current_steps": 29, "total_steps": 132, "loss": 0.7213, "lr": 0.00019313361774523385, "epoch": 0.6666666666666666, "percentage": 21.97, "elapsed_time": "1:49:24", "remaining_time": "6:28:34"}
{"current_steps": 30, "total_steps": 132, "loss": 0.7376, "lr": 0.00019213119778704128, "epoch": 0.6896551724137931, "percentage": 22.73, "elapsed_time": "1:52:49", "remaining_time": "6:23:37"}
{"current_steps": 30, "total_steps": 132, "eval_loss": 0.732206404209137, "epoch": 0.6896551724137931, "percentage": 22.73, "elapsed_time": "1:57:53", "remaining_time": "6:40:50"}
{"current_steps": 31, "total_steps": 132, "loss": 0.7336, "lr": 0.00019106347728549135, "epoch": 0.7126436781609196, "percentage": 23.48, "elapsed_time": "2:01:15", "remaining_time": "6:35:05"}
{"current_steps": 32, "total_steps": 132, "loss": 0.7253, "lr": 0.00018993121301712193, "epoch": 0.735632183908046, "percentage": 24.24, "elapsed_time": "2:04:40", "remaining_time": "6:29:36"}
{"current_steps": 33, "total_steps": 132, "loss": 0.7232, "lr": 0.00018873520750565718, "epoch": 0.7586206896551724, "percentage": 25.0, "elapsed_time": "2:08:04", "remaining_time": "6:24:13"}
{"current_steps": 34, "total_steps": 132, "loss": 0.727, "lr": 0.00018747630845319612, "epoch": 0.7816091954022989, "percentage": 25.76, "elapsed_time": "2:11:30", "remaining_time": "6:19:02"}
{"current_steps": 35, "total_steps": 132, "loss": 0.7152, "lr": 0.0001861554081393806, "epoch": 0.8045977011494253, "percentage": 26.52, "elapsed_time": "2:14:54", "remaining_time": "6:13:52"}
{"current_steps": 36, "total_steps": 132, "loss": 0.7059, "lr": 0.0001847734427889671, "epoch": 0.8275862068965517, "percentage": 27.27, "elapsed_time": "2:18:16", "remaining_time": "6:08:44"}
{"current_steps": 37, "total_steps": 132, "loss": 0.7202, "lr": 0.0001833313919082515, "epoch": 0.8505747126436781, "percentage": 28.03, "elapsed_time": "2:21:40", "remaining_time": "6:03:44"}
{"current_steps": 38, "total_steps": 132, "loss": 0.7033, "lr": 0.0001818302775908169, "epoch": 0.8735632183908046, "percentage": 28.79, "elapsed_time": "2:25:03", "remaining_time": "5:58:50"}
{"current_steps": 39, "total_steps": 132, "loss": 0.7127, "lr": 0.00018027116379309638, "epoch": 0.896551724137931, "percentage": 29.55, "elapsed_time": "2:28:26", "remaining_time": "5:53:59"}
{"current_steps": 40, "total_steps": 132, "loss": 0.7202, "lr": 0.00017865515558026428, "epoch": 0.9195402298850575, "percentage": 30.3, "elapsed_time": "2:31:50", "remaining_time": "5:49:13"}
{"current_steps": 40, "total_steps": 132, "eval_loss": 0.709326446056366, "epoch": 0.9195402298850575, "percentage": 30.3, "elapsed_time": "2:36:55", "remaining_time": "6:00:56"}
{"current_steps": 41, "total_steps": 132, "loss": 0.7075, "lr": 0.00017698339834299061, "epoch": 0.9425287356321839, "percentage": 31.06, "elapsed_time": "2:40:20", "remaining_time": "5:55:52"}
{"current_steps": 42, "total_steps": 132, "loss": 0.6974, "lr": 0.00017525707698561385, "epoch": 0.9655172413793104, "percentage": 31.82, "elapsed_time": "2:43:44", "remaining_time": "5:50:52"}
{"current_steps": 43, "total_steps": 132, "loss": 0.7148, "lr": 0.00017347741508630672, "epoch": 0.9885057471264368, "percentage": 32.58, "elapsed_time": "2:47:09", "remaining_time": "5:45:59"}
{"current_steps": 44, "total_steps": 132, "loss": 0.716, "lr": 0.00017164567402983152, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "2:48:55", "remaining_time": "5:37:50"}
{"current_steps": 45, "total_steps": 132, "loss": 0.696, "lr": 0.0001697631521134985, "epoch": 1.0229885057471264, "percentage": 34.09, "elapsed_time": "2:52:20", "remaining_time": "5:33:12"}
{"current_steps": 46, "total_steps": 132, "loss": 0.6967, "lr": 0.00016783118362696163, "epoch": 1.0459770114942528, "percentage": 34.85, "elapsed_time": "2:55:44", "remaining_time": "5:28:34"}
{"current_steps": 47, "total_steps": 132, "loss": 0.6977, "lr": 0.00016585113790650388, "epoch": 1.0689655172413792, "percentage": 35.61, "elapsed_time": "2:59:08", "remaining_time": "5:23:59"}
{"current_steps": 48, "total_steps": 132, "loss": 0.6856, "lr": 0.00016382441836448202, "epoch": 1.0919540229885056, "percentage": 36.36, "elapsed_time": "3:02:33", "remaining_time": "5:19:27"}
{"current_steps": 49, "total_steps": 132, "loss": 0.6991, "lr": 0.0001617524614946192, "epoch": 1.1149425287356323, "percentage": 37.12, "elapsed_time": "3:05:58", "remaining_time": "5:15:00"}
{"current_steps": 50, "total_steps": 132, "loss": 0.6826, "lr": 0.00015963673585385016, "epoch": 1.1379310344827587, "percentage": 37.88, "elapsed_time": "3:09:23", "remaining_time": "5:10:35"}
{"current_steps": 50, "total_steps": 132, "eval_loss": 0.6974772214889526, "epoch": 1.1379310344827587, "percentage": 37.88, "elapsed_time": "3:14:28", "remaining_time": "5:18:55"}
{"current_steps": 51, "total_steps": 132, "loss": 0.6958, "lr": 0.0001574787410214407, "epoch": 1.160919540229885, "percentage": 38.64, "elapsed_time": "3:18:13", "remaining_time": "5:14:49"}
{"current_steps": 52, "total_steps": 132, "loss": 0.6889, "lr": 0.00015528000653611935, "epoch": 1.1839080459770115, "percentage": 39.39, "elapsed_time": "3:21:42", "remaining_time": "5:10:18"}
{"current_steps": 53, "total_steps": 132, "loss": 0.6709, "lr": 0.00015304209081197425, "epoch": 1.206896551724138, "percentage": 40.15, "elapsed_time": "3:25:06", "remaining_time": "5:05:44"}
{"current_steps": 54, "total_steps": 132, "loss": 0.6841, "lr": 0.000150766580033884, "epoch": 1.2298850574712643, "percentage": 40.91, "elapsed_time": "3:28:33", "remaining_time": "5:01:14"}
{"current_steps": 55, "total_steps": 132, "loss": 0.6971, "lr": 0.00014845508703326504, "epoch": 1.2528735632183907, "percentage": 41.67, "elapsed_time": "3:31:57", "remaining_time": "4:56:44"}
{"current_steps": 56, "total_steps": 132, "loss": 0.6815, "lr": 0.0001461092501449326, "epoch": 1.2758620689655173, "percentage": 42.42, "elapsed_time": "3:35:22", "remaining_time": "4:52:17"}
{"current_steps": 57, "total_steps": 132, "loss": 0.6829, "lr": 0.00014373073204588556, "epoch": 1.2988505747126438, "percentage": 43.18, "elapsed_time": "3:38:45", "remaining_time": "4:47:50"}
{"current_steps": 58, "total_steps": 132, "loss": 0.6788, "lr": 0.00014132121857683783, "epoch": 1.3218390804597702, "percentage": 43.94, "elapsed_time": "3:42:13", "remaining_time": "4:43:31"}
{"current_steps": 59, "total_steps": 132, "loss": 0.6867, "lr": 0.00013888241754733208, "epoch": 1.3448275862068966, "percentage": 44.7, "elapsed_time": "3:45:37", "remaining_time": "4:39:09"}
{"current_steps": 60, "total_steps": 132, "loss": 0.6718, "lr": 0.00013641605752528224, "epoch": 1.367816091954023, "percentage": 45.45, "elapsed_time": "3:49:01", "remaining_time": "4:34:50"}
{"current_steps": 60, "total_steps": 132, "eval_loss": 0.6893976926803589, "epoch": 1.367816091954023, "percentage": 45.45, "elapsed_time": "3:54:07", "remaining_time": "4:40:56"}
{"current_steps": 61, "total_steps": 132, "loss": 0.6663, "lr": 0.00013392388661180303, "epoch": 1.3908045977011494, "percentage": 46.21, "elapsed_time": "3:57:31", "remaining_time": "4:36:28"}
{"current_steps": 62, "total_steps": 132, "loss": 0.6805, "lr": 0.0001314076712021949, "epoch": 1.4137931034482758, "percentage": 46.97, "elapsed_time": "4:00:57", "remaining_time": "4:32:03"}
{"current_steps": 63, "total_steps": 132, "loss": 0.6965, "lr": 0.0001288691947339621, "epoch": 1.4367816091954024, "percentage": 47.73, "elapsed_time": "4:04:20", "remaining_time": "4:27:36"}
{"current_steps": 64, "total_steps": 132, "loss": 0.6665, "lr": 0.00012631025642275212, "epoch": 1.4597701149425286, "percentage": 48.48, "elapsed_time": "4:07:45", "remaining_time": "4:23:14"}
{"current_steps": 65, "total_steps": 132, "loss": 0.6782, "lr": 0.0001237326699871115, "epoch": 1.4827586206896552, "percentage": 49.24, "elapsed_time": "4:11:10", "remaining_time": "4:18:53"}
{"current_steps": 66, "total_steps": 132, "loss": 0.681, "lr": 0.00012113826236296244, "epoch": 1.5057471264367817, "percentage": 50.0, "elapsed_time": "4:14:34", "remaining_time": "4:14:34"}
{"current_steps": 67, "total_steps": 132, "loss": 0.6584, "lr": 0.00011852887240871145, "epoch": 1.528735632183908, "percentage": 50.76, "elapsed_time": "4:17:59", "remaining_time": "4:10:17"}
{"current_steps": 68, "total_steps": 132, "loss": 0.6917, "lr": 0.00011590634960190721, "epoch": 1.5517241379310345, "percentage": 51.52, "elapsed_time": "4:21:25", "remaining_time": "4:06:02"}
{"current_steps": 69, "total_steps": 132, "loss": 0.6786, "lr": 0.00011327255272837221, "epoch": 1.5747126436781609, "percentage": 52.27, "elapsed_time": "4:24:52", "remaining_time": "4:01:50"}
{"current_steps": 70, "total_steps": 132, "loss": 0.6726, "lr": 0.00011062934856473655, "epoch": 1.5977011494252875, "percentage": 53.03, "elapsed_time": "4:28:17", "remaining_time": "3:57:37"}
{"current_steps": 70, "total_steps": 132, "eval_loss": 0.6833033561706543, "epoch": 1.5977011494252875, "percentage": 53.03, "elapsed_time": "4:33:22", "remaining_time": "4:02:07"}
{"current_steps": 71, "total_steps": 132, "loss": 0.6741, "lr": 0.00010797861055530831, "epoch": 1.6206896551724137, "percentage": 53.79, "elapsed_time": "4:36:46", "remaining_time": "3:57:47"}
{"current_steps": 72, "total_steps": 132, "loss": 0.6622, "lr": 0.00010532221748421787, "epoch": 1.6436781609195403, "percentage": 54.55, "elapsed_time": "4:40:09", "remaining_time": "3:53:28"}
{"current_steps": 73, "total_steps": 132, "loss": 0.6839, "lr": 0.00010266205214377748, "epoch": 1.6666666666666665, "percentage": 55.3, "elapsed_time": "4:43:35", "remaining_time": "3:49:11"}
{"current_steps": 74, "total_steps": 132, "loss": 0.6843, "lr": 0.0001, "epoch": 1.6896551724137931, "percentage": 56.06, "elapsed_time": "4:46:59", "remaining_time": "3:44:56"}
{"current_steps": 75, "total_steps": 132, "loss": 0.6902, "lr": 9.733794785622253e-05, "epoch": 1.7126436781609196, "percentage": 56.82, "elapsed_time": "4:50:22", "remaining_time": "3:40:41"}
{"current_steps": 76, "total_steps": 132, "loss": 0.67, "lr": 9.467778251578217e-05, "epoch": 1.735632183908046, "percentage": 57.58, "elapsed_time": "4:53:46", "remaining_time": "3:36:28"}
{"current_steps": 77, "total_steps": 132, "loss": 0.6688, "lr": 9.202138944469168e-05, "epoch": 1.7586206896551724, "percentage": 58.33, "elapsed_time": "4:57:14", "remaining_time": "3:32:18"}
{"current_steps": 78, "total_steps": 132, "loss": 0.6744, "lr": 8.937065143526347e-05, "epoch": 1.7816091954022988, "percentage": 59.09, "elapsed_time": "5:00:38", "remaining_time": "3:28:08"}
{"current_steps": 79, "total_steps": 132, "loss": 0.6766, "lr": 8.672744727162781e-05, "epoch": 1.8045977011494254, "percentage": 59.85, "elapsed_time": "5:04:03", "remaining_time": "3:23:59"}
{"current_steps": 80, "total_steps": 132, "loss": 0.6683, "lr": 8.409365039809281e-05, "epoch": 1.8275862068965516, "percentage": 60.61, "elapsed_time": "5:07:28", "remaining_time": "3:19:51"}
{"current_steps": 80, "total_steps": 132, "eval_loss": 0.6785663962364197, "epoch": 1.8275862068965516, "percentage": 60.61, "elapsed_time": "5:12:33", "remaining_time": "3:23:09"}
{"current_steps": 81, "total_steps": 132, "loss": 0.6665, "lr": 8.147112759128859e-05, "epoch": 1.8505747126436782, "percentage": 61.36, "elapsed_time": "5:15:59", "remaining_time": "3:18:57"}
{"current_steps": 82, "total_steps": 132, "loss": 0.6651, "lr": 7.886173763703757e-05, "epoch": 1.8735632183908046, "percentage": 62.12, "elapsed_time": "5:19:24", "remaining_time": "3:14:45"}
{"current_steps": 83, "total_steps": 132, "loss": 0.6578, "lr": 7.626733001288851e-05, "epoch": 1.896551724137931, "percentage": 62.88, "elapsed_time": "5:22:48", "remaining_time": "3:10:34"}
{"current_steps": 84, "total_steps": 132, "loss": 0.6689, "lr": 7.368974357724789e-05, "epoch": 1.9195402298850575, "percentage": 63.64, "elapsed_time": "5:26:14", "remaining_time": "3:06:25"}
{"current_steps": 85, "total_steps": 132, "loss": 0.676, "lr": 7.113080526603792e-05, "epoch": 1.9425287356321839, "percentage": 64.39, "elapsed_time": "5:29:39", "remaining_time": "3:02:16"}
{"current_steps": 86, "total_steps": 132, "loss": 0.6514, "lr": 6.859232879780515e-05, "epoch": 1.9655172413793105, "percentage": 65.15, "elapsed_time": "5:33:02", "remaining_time": "2:58:08"}
{"current_steps": 87, "total_steps": 132, "loss": 0.6728, "lr": 6.607611338819697e-05, "epoch": 1.9885057471264367, "percentage": 65.91, "elapsed_time": "5:36:26", "remaining_time": "2:54:01"}
{"current_steps": 88, "total_steps": 132, "loss": 0.677, "lr": 6.358394247471778e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "5:38:12", "remaining_time": "2:49:06"}
{"current_steps": 89, "total_steps": 132, "loss": 0.6688, "lr": 6.111758245266794e-05, "epoch": 2.0229885057471266, "percentage": 67.42, "elapsed_time": "5:41:36", "remaining_time": "2:45:03"}
{"current_steps": 90, "total_steps": 132, "loss": 0.6532, "lr": 5.867878142316221e-05, "epoch": 2.045977011494253, "percentage": 68.18, "elapsed_time": "5:45:03", "remaining_time": "2:41:01"}
{"current_steps": 90, "total_steps": 132, "eval_loss": 0.6744519472122192, "epoch": 2.045977011494253, "percentage": 68.18, "elapsed_time": "5:50:07", "remaining_time": "2:43:23"}
{"current_steps": 91, "total_steps": 132, "loss": 0.6624, "lr": 5.626926795411447e-05, "epoch": 2.0689655172413794, "percentage": 68.94, "elapsed_time": "5:53:32", "remaining_time": "2:39:17"}
{"current_steps": 92, "total_steps": 132, "loss": 0.6688, "lr": 5.38907498550674e-05, "epoch": 2.0919540229885056, "percentage": 69.7, "elapsed_time": "5:56:56", "remaining_time": "2:35:11"}
{"current_steps": 93, "total_steps": 132, "loss": 0.6733, "lr": 5.1544912966734994e-05, "epoch": 2.1149425287356323, "percentage": 70.45, "elapsed_time": "6:00:21", "remaining_time": "2:31:07"}
{"current_steps": 94, "total_steps": 132, "loss": 0.6558, "lr": 4.9233419966116036e-05, "epoch": 2.1379310344827585, "percentage": 71.21, "elapsed_time": "6:03:46", "remaining_time": "2:27:03"}
{"current_steps": 95, "total_steps": 132, "loss": 0.6491, "lr": 4.695790918802576e-05, "epoch": 2.160919540229885, "percentage": 71.97, "elapsed_time": "6:07:11", "remaining_time": "2:23:00"}
{"current_steps": 96, "total_steps": 132, "loss": 0.6781, "lr": 4.47199934638807e-05, "epoch": 2.1839080459770113, "percentage": 72.73, "elapsed_time": "6:10:37", "remaining_time": "2:18:59"}
{"current_steps": 97, "total_steps": 132, "loss": 0.6603, "lr": 4.252125897855932e-05, "epoch": 2.206896551724138, "percentage": 73.48, "elapsed_time": "6:14:01", "remaining_time": "2:14:57"}
{"current_steps": 98, "total_steps": 132, "loss": 0.6511, "lr": 4.036326414614985e-05, "epoch": 2.2298850574712645, "percentage": 74.24, "elapsed_time": "6:17:26", "remaining_time": "2:10:57"}
{"current_steps": 99, "total_steps": 132, "loss": 0.6646, "lr": 3.824753850538082e-05, "epoch": 2.2528735632183907, "percentage": 75.0, "elapsed_time": "6:20:52", "remaining_time": "2:06:57"}
{"current_steps": 100, "total_steps": 132, "loss": 0.6622, "lr": 3.617558163551802e-05, "epoch": 2.2758620689655173, "percentage": 75.76, "elapsed_time": "6:24:17", "remaining_time": "2:02:58"}
{"current_steps": 100, "total_steps": 132, "eval_loss": 0.6719217300415039, "epoch": 2.2758620689655173, "percentage": 75.76, "elapsed_time": "6:29:23", "remaining_time": "2:04:36"}
{"current_steps": 101, "total_steps": 132, "loss": 0.6514, "lr": 3.414886209349615e-05, "epoch": 2.2988505747126435, "percentage": 76.52, "elapsed_time": "6:33:08", "remaining_time": "2:00:40"}
{"current_steps": 102, "total_steps": 132, "loss": 0.6555, "lr": 3.216881637303839e-05, "epoch": 2.32183908045977, "percentage": 77.27, "elapsed_time": "6:36:33", "remaining_time": "1:56:37"}
{"current_steps": 103, "total_steps": 132, "loss": 0.6613, "lr": 3.0236847886501542e-05, "epoch": 2.344827586206897, "percentage": 78.03, "elapsed_time": "6:39:57", "remaining_time": "1:52:36"}
{"current_steps": 104, "total_steps": 132, "loss": 0.6471, "lr": 2.8354325970168484e-05, "epoch": 2.367816091954023, "percentage": 78.79, "elapsed_time": "6:43:25", "remaining_time": "1:48:36"}
{"current_steps": 105, "total_steps": 132, "loss": 0.646, "lr": 2.6522584913693294e-05, "epoch": 2.3908045977011496, "percentage": 79.55, "elapsed_time": "6:46:49", "remaining_time": "1:44:36"}
{"current_steps": 106, "total_steps": 132, "loss": 0.6546, "lr": 2.4742923014386156e-05, "epoch": 2.413793103448276, "percentage": 80.3, "elapsed_time": "6:50:15", "remaining_time": "1:40:37"}
{"current_steps": 107, "total_steps": 132, "loss": 0.6588, "lr": 2.301660165700936e-05, "epoch": 2.4367816091954024, "percentage": 81.06, "elapsed_time": "6:53:39", "remaining_time": "1:36:38"}
{"current_steps": 108, "total_steps": 132, "loss": 0.6473, "lr": 2.1344844419735755e-05, "epoch": 2.4597701149425286, "percentage": 81.82, "elapsed_time": "6:57:02", "remaining_time": "1:32:40"}
{"current_steps": 109, "total_steps": 132, "loss": 0.6528, "lr": 1.9728836206903656e-05, "epoch": 2.4827586206896552, "percentage": 82.58, "elapsed_time": "7:00:26", "remaining_time": "1:28:43"}
{"current_steps": 110, "total_steps": 132, "loss": 0.6476, "lr": 1.8169722409183097e-05, "epoch": 2.5057471264367814, "percentage": 83.33, "elapsed_time": "7:03:53", "remaining_time": "1:24:46"}
{"current_steps": 110, "total_steps": 132, "eval_loss": 0.6705266237258911, "epoch": 2.5057471264367814, "percentage": 83.33, "elapsed_time": "7:08:58", "remaining_time": "1:25:47"}
{"current_steps": 111, "total_steps": 132, "loss": 0.6563, "lr": 1.6668608091748495e-05, "epoch": 2.528735632183908, "percentage": 84.09, "elapsed_time": "7:12:26", "remaining_time": "1:21:48"}
{"current_steps": 112, "total_steps": 132, "loss": 0.6458, "lr": 1.522655721103291e-05, "epoch": 2.5517241379310347, "percentage": 84.85, "elapsed_time": "7:15:53", "remaining_time": "1:17:50"}
{"current_steps": 113, "total_steps": 132, "loss": 0.6541, "lr": 1.3844591860619383e-05, "epoch": 2.574712643678161, "percentage": 85.61, "elapsed_time": "7:19:17", "remaining_time": "1:13:51"}
{"current_steps": 114, "total_steps": 132, "loss": 0.6475, "lr": 1.2523691546803873e-05, "epoch": 2.5977011494252875, "percentage": 86.36, "elapsed_time": "7:22:41", "remaining_time": "1:09:53"}
{"current_steps": 115, "total_steps": 132, "loss": 0.6705, "lr": 1.1264792494342857e-05, "epoch": 2.6206896551724137, "percentage": 87.12, "elapsed_time": "7:26:06", "remaining_time": "1:05:56"}
{"current_steps": 116, "total_steps": 132, "loss": 0.6422, "lr": 1.0068786982878087e-05, "epoch": 2.6436781609195403, "percentage": 87.88, "elapsed_time": "7:29:29", "remaining_time": "1:01:59"}
{"current_steps": 117, "total_steps": 132, "loss": 0.6622, "lr": 8.936522714508678e-06, "epoch": 2.6666666666666665, "percentage": 88.64, "elapsed_time": "7:32:52", "remaining_time": "0:58:03"}
{"current_steps": 118, "total_steps": 132, "loss": 0.6529, "lr": 7.868802212958703e-06, "epoch": 2.689655172413793, "percentage": 89.39, "elapsed_time": "7:36:16", "remaining_time": "0:54:08"}
{"current_steps": 119, "total_steps": 132, "loss": 0.6558, "lr": 6.866382254766157e-06, "epoch": 2.7126436781609193, "percentage": 90.15, "elapsed_time": "7:39:40", "remaining_time": "0:50:12"}
{"current_steps": 120, "total_steps": 132, "loss": 0.6399, "lr": 5.929973332896677e-06, "epoch": 2.735632183908046, "percentage": 90.91, "elapsed_time": "7:43:05", "remaining_time": "0:46:18"}
{"current_steps": 120, "total_steps": 132, "eval_loss": 0.6699749231338501, "epoch": 2.735632183908046, "percentage": 90.91, "elapsed_time": "7:48:08", "remaining_time": "0:46:48"}
{"current_steps": 121, "total_steps": 132, "loss": 0.6566, "lr": 5.060239153161872e-06, "epoch": 2.7586206896551726, "percentage": 91.67, "elapsed_time": "7:51:32", "remaining_time": "0:42:52"}
{"current_steps": 122, "total_steps": 132, "loss": 0.6564, "lr": 4.257796163799455e-06, "epoch": 2.781609195402299, "percentage": 92.42, "elapsed_time": "7:54:57", "remaining_time": "0:38:55"}
{"current_steps": 123, "total_steps": 132, "loss": 0.6487, "lr": 3.5232131185484076e-06, "epoch": 2.8045977011494254, "percentage": 93.18, "elapsed_time": "7:58:24", "remaining_time": "0:35:00"}
{"current_steps": 124, "total_steps": 132, "loss": 0.6394, "lr": 2.857010673529015e-06, "epoch": 2.8275862068965516, "percentage": 93.94, "elapsed_time": "8:01:48", "remaining_time": "0:31:05"}
{"current_steps": 125, "total_steps": 132, "loss": 0.6562, "lr": 2.259661018213333e-06, "epoch": 2.8505747126436782, "percentage": 94.7, "elapsed_time": "8:05:10", "remaining_time": "0:27:10"}
{"current_steps": 126, "total_steps": 132, "loss": 0.6446, "lr": 1.7315875407479032e-06, "epoch": 2.873563218390805, "percentage": 95.45, "elapsed_time": "8:08:33", "remaining_time": "0:23:15"}
{"current_steps": 127, "total_steps": 132, "loss": 0.6519, "lr": 1.2731645278655445e-06, "epoch": 2.896551724137931, "percentage": 96.21, "elapsed_time": "8:11:57", "remaining_time": "0:19:22"}
{"current_steps": 128, "total_steps": 132, "loss": 0.652, "lr": 8.847168995992916e-07, "epoch": 2.9195402298850572, "percentage": 96.97, "elapsed_time": "8:15:21", "remaining_time": "0:15:28"}
{"current_steps": 129, "total_steps": 132, "loss": 0.647, "lr": 5.665199789862907e-07, "epoch": 2.942528735632184, "percentage": 97.73, "elapsed_time": "8:18:43", "remaining_time": "0:11:35"}
{"current_steps": 130, "total_steps": 132, "loss": 0.643, "lr": 3.1879929692498757e-07, "epoch": 2.9655172413793105, "percentage": 98.48, "elapsed_time": "8:22:07", "remaining_time": "0:07:43"}
{"current_steps": 130, "total_steps": 132, "eval_loss": 0.6699010729789734, "epoch": 2.9655172413793105, "percentage": 98.48, "elapsed_time": "8:27:08", "remaining_time": "0:07:48"}
{"current_steps": 131, "total_steps": 132, "loss": 0.6597, "lr": 1.4173043232380557e-07, "epoch": 2.9885057471264367, "percentage": 99.24, "elapsed_time": "8:30:30", "remaining_time": "0:03:53"}
{"current_steps": 132, "total_steps": 132, "loss": 0.6579, "lr": 3.5438887654737355e-08, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "8:32:14", "remaining_time": "0:00:00"}
{"current_steps": 132, "total_steps": 132, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "8:32:34", "remaining_time": "0:00:00"}