top_11_ranking_stackexchange / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
d2963ab verified
{"current_steps": 10, "total_steps": 1203, "loss": 1.0469, "lr": 5e-06, "epoch": 0.024906600249066, "percentage": 0.83, "elapsed_time": "0:09:40", "remaining_time": "19:14:27"}
{"current_steps": 20, "total_steps": 1203, "loss": 0.9485, "lr": 5e-06, "epoch": 0.049813200498132, "percentage": 1.66, "elapsed_time": "0:19:16", "remaining_time": "19:00:08"}
{"current_steps": 30, "total_steps": 1203, "loss": 0.9118, "lr": 5e-06, "epoch": 0.074719800747198, "percentage": 2.49, "elapsed_time": "0:28:52", "remaining_time": "18:49:04"}
{"current_steps": 40, "total_steps": 1203, "loss": 0.896, "lr": 5e-06, "epoch": 0.099626400996264, "percentage": 3.33, "elapsed_time": "0:38:28", "remaining_time": "18:38:38"}
{"current_steps": 50, "total_steps": 1203, "loss": 0.885, "lr": 5e-06, "epoch": 0.12453300124533001, "percentage": 4.16, "elapsed_time": "0:48:04", "remaining_time": "18:28:45"}
{"current_steps": 60, "total_steps": 1203, "loss": 0.8743, "lr": 5e-06, "epoch": 0.149439601494396, "percentage": 4.99, "elapsed_time": "0:57:40", "remaining_time": "18:18:45"}
{"current_steps": 70, "total_steps": 1203, "loss": 0.865, "lr": 5e-06, "epoch": 0.17434620174346202, "percentage": 5.82, "elapsed_time": "1:07:17", "remaining_time": "18:09:04"}
{"current_steps": 80, "total_steps": 1203, "loss": 0.8637, "lr": 5e-06, "epoch": 0.199252801992528, "percentage": 6.65, "elapsed_time": "1:16:52", "remaining_time": "17:59:11"}
{"current_steps": 90, "total_steps": 1203, "loss": 0.8538, "lr": 5e-06, "epoch": 0.22415940224159403, "percentage": 7.48, "elapsed_time": "1:26:27", "remaining_time": "17:49:18"}
{"current_steps": 100, "total_steps": 1203, "loss": 0.8462, "lr": 5e-06, "epoch": 0.24906600249066002, "percentage": 8.31, "elapsed_time": "1:36:02", "remaining_time": "17:39:22"}
{"current_steps": 110, "total_steps": 1203, "loss": 0.8516, "lr": 5e-06, "epoch": 0.273972602739726, "percentage": 9.14, "elapsed_time": "1:45:38", "remaining_time": "17:29:38"}
{"current_steps": 120, "total_steps": 1203, "loss": 0.8424, "lr": 5e-06, "epoch": 0.298879202988792, "percentage": 9.98, "elapsed_time": "1:55:13", "remaining_time": "17:19:53"}
{"current_steps": 130, "total_steps": 1203, "loss": 0.838, "lr": 5e-06, "epoch": 0.32378580323785805, "percentage": 10.81, "elapsed_time": "2:04:47", "remaining_time": "17:10:04"}
{"current_steps": 140, "total_steps": 1203, "loss": 0.8425, "lr": 5e-06, "epoch": 0.34869240348692404, "percentage": 11.64, "elapsed_time": "2:14:23", "remaining_time": "17:00:26"}
{"current_steps": 150, "total_steps": 1203, "loss": 0.8394, "lr": 5e-06, "epoch": 0.37359900373599003, "percentage": 12.47, "elapsed_time": "2:23:59", "remaining_time": "16:50:52"}
{"current_steps": 160, "total_steps": 1203, "loss": 0.8331, "lr": 5e-06, "epoch": 0.398505603985056, "percentage": 13.3, "elapsed_time": "2:33:36", "remaining_time": "16:41:17"}
{"current_steps": 170, "total_steps": 1203, "loss": 0.8326, "lr": 5e-06, "epoch": 0.42341220423412207, "percentage": 14.13, "elapsed_time": "2:43:11", "remaining_time": "16:31:38"}
{"current_steps": 180, "total_steps": 1203, "loss": 0.8279, "lr": 5e-06, "epoch": 0.44831880448318806, "percentage": 14.96, "elapsed_time": "2:52:47", "remaining_time": "16:22:02"}
{"current_steps": 190, "total_steps": 1203, "loss": 0.8289, "lr": 5e-06, "epoch": 0.47322540473225405, "percentage": 15.79, "elapsed_time": "3:02:23", "remaining_time": "16:12:28"}
{"current_steps": 200, "total_steps": 1203, "loss": 0.8269, "lr": 5e-06, "epoch": 0.49813200498132004, "percentage": 16.63, "elapsed_time": "3:11:59", "remaining_time": "16:02:50"}
{"current_steps": 210, "total_steps": 1203, "loss": 0.827, "lr": 5e-06, "epoch": 0.523038605230386, "percentage": 17.46, "elapsed_time": "3:21:35", "remaining_time": "15:53:14"}
{"current_steps": 220, "total_steps": 1203, "loss": 0.8278, "lr": 5e-06, "epoch": 0.547945205479452, "percentage": 18.29, "elapsed_time": "3:31:11", "remaining_time": "15:43:36"}
{"current_steps": 230, "total_steps": 1203, "loss": 0.8255, "lr": 5e-06, "epoch": 0.572851805728518, "percentage": 19.12, "elapsed_time": "3:40:46", "remaining_time": "15:33:57"}
{"current_steps": 240, "total_steps": 1203, "loss": 0.8247, "lr": 5e-06, "epoch": 0.597758405977584, "percentage": 19.95, "elapsed_time": "3:50:21", "remaining_time": "15:24:19"}
{"current_steps": 250, "total_steps": 1203, "loss": 0.8211, "lr": 5e-06, "epoch": 0.6226650062266501, "percentage": 20.78, "elapsed_time": "3:59:56", "remaining_time": "15:14:40"}
{"current_steps": 260, "total_steps": 1203, "loss": 0.8205, "lr": 5e-06, "epoch": 0.6475716064757161, "percentage": 21.61, "elapsed_time": "4:09:33", "remaining_time": "15:05:06"}
{"current_steps": 270, "total_steps": 1203, "loss": 0.8175, "lr": 5e-06, "epoch": 0.6724782067247821, "percentage": 22.44, "elapsed_time": "4:19:09", "remaining_time": "14:55:31"}
{"current_steps": 280, "total_steps": 1203, "loss": 0.8266, "lr": 5e-06, "epoch": 0.6973848069738481, "percentage": 23.28, "elapsed_time": "4:28:46", "remaining_time": "14:45:59"}
{"current_steps": 290, "total_steps": 1203, "loss": 0.8213, "lr": 5e-06, "epoch": 0.7222914072229141, "percentage": 24.11, "elapsed_time": "4:38:21", "remaining_time": "14:36:21"}
{"current_steps": 300, "total_steps": 1203, "loss": 0.8197, "lr": 5e-06, "epoch": 0.7471980074719801, "percentage": 24.94, "elapsed_time": "4:47:57", "remaining_time": "14:26:46"}
{"current_steps": 310, "total_steps": 1203, "loss": 0.8171, "lr": 5e-06, "epoch": 0.772104607721046, "percentage": 25.77, "elapsed_time": "4:57:33", "remaining_time": "14:17:10"}
{"current_steps": 320, "total_steps": 1203, "loss": 0.8159, "lr": 5e-06, "epoch": 0.797011207970112, "percentage": 26.6, "elapsed_time": "5:07:09", "remaining_time": "14:07:34"}
{"current_steps": 330, "total_steps": 1203, "loss": 0.8156, "lr": 5e-06, "epoch": 0.821917808219178, "percentage": 27.43, "elapsed_time": "5:16:45", "remaining_time": "13:57:57"}
{"current_steps": 340, "total_steps": 1203, "loss": 0.8136, "lr": 5e-06, "epoch": 0.8468244084682441, "percentage": 28.26, "elapsed_time": "5:26:20", "remaining_time": "13:48:18"}
{"current_steps": 350, "total_steps": 1203, "loss": 0.8091, "lr": 5e-06, "epoch": 0.8717310087173101, "percentage": 29.09, "elapsed_time": "5:35:54", "remaining_time": "13:38:40"}
{"current_steps": 360, "total_steps": 1203, "loss": 0.8127, "lr": 5e-06, "epoch": 0.8966376089663761, "percentage": 29.93, "elapsed_time": "5:45:31", "remaining_time": "13:29:06"}
{"current_steps": 370, "total_steps": 1203, "loss": 0.8139, "lr": 5e-06, "epoch": 0.9215442092154421, "percentage": 30.76, "elapsed_time": "5:55:08", "remaining_time": "13:19:32"}
{"current_steps": 380, "total_steps": 1203, "loss": 0.8148, "lr": 5e-06, "epoch": 0.9464508094645081, "percentage": 31.59, "elapsed_time": "6:04:44", "remaining_time": "13:09:56"}
{"current_steps": 390, "total_steps": 1203, "loss": 0.8133, "lr": 5e-06, "epoch": 0.9713574097135741, "percentage": 32.42, "elapsed_time": "6:14:19", "remaining_time": "13:00:19"}
{"current_steps": 400, "total_steps": 1203, "loss": 0.8102, "lr": 5e-06, "epoch": 0.9962640099626401, "percentage": 33.25, "elapsed_time": "6:23:56", "remaining_time": "12:50:44"}
{"current_steps": 401, "total_steps": 1203, "eval_loss": 0.8109647631645203, "epoch": 0.9987546699875467, "percentage": 33.33, "elapsed_time": "6:32:31", "remaining_time": "13:05:03"}
{"current_steps": 410, "total_steps": 1203, "loss": 0.8079, "lr": 5e-06, "epoch": 1.0211706102117062, "percentage": 34.08, "elapsed_time": "6:41:54", "remaining_time": "12:57:21"}
{"current_steps": 420, "total_steps": 1203, "loss": 0.7693, "lr": 5e-06, "epoch": 1.046077210460772, "percentage": 34.91, "elapsed_time": "6:51:31", "remaining_time": "12:47:11"}
{"current_steps": 430, "total_steps": 1203, "loss": 0.7659, "lr": 5e-06, "epoch": 1.0709838107098382, "percentage": 35.74, "elapsed_time": "7:01:07", "remaining_time": "12:37:02"}
{"current_steps": 440, "total_steps": 1203, "loss": 0.7669, "lr": 5e-06, "epoch": 1.095890410958904, "percentage": 36.58, "elapsed_time": "7:10:42", "remaining_time": "12:26:53"}
{"current_steps": 450, "total_steps": 1203, "loss": 0.7676, "lr": 5e-06, "epoch": 1.1207970112079702, "percentage": 37.41, "elapsed_time": "7:20:19", "remaining_time": "12:16:48"}
{"current_steps": 460, "total_steps": 1203, "loss": 0.7668, "lr": 5e-06, "epoch": 1.145703611457036, "percentage": 38.24, "elapsed_time": "7:29:55", "remaining_time": "12:06:43"}
{"current_steps": 470, "total_steps": 1203, "loss": 0.7653, "lr": 5e-06, "epoch": 1.1706102117061021, "percentage": 39.07, "elapsed_time": "7:39:31", "remaining_time": "11:56:39"}
{"current_steps": 480, "total_steps": 1203, "loss": 0.7691, "lr": 5e-06, "epoch": 1.195516811955168, "percentage": 39.9, "elapsed_time": "7:49:07", "remaining_time": "11:46:37"}
{"current_steps": 490, "total_steps": 1203, "loss": 0.7692, "lr": 5e-06, "epoch": 1.2204234122042341, "percentage": 40.73, "elapsed_time": "7:58:42", "remaining_time": "11:36:34"}
{"current_steps": 500, "total_steps": 1203, "loss": 0.77, "lr": 5e-06, "epoch": 1.2453300124533002, "percentage": 41.56, "elapsed_time": "8:08:17", "remaining_time": "11:26:32"}
{"current_steps": 510, "total_steps": 1203, "loss": 0.7649, "lr": 5e-06, "epoch": 1.270236612702366, "percentage": 42.39, "elapsed_time": "8:17:53", "remaining_time": "11:16:32"}
{"current_steps": 520, "total_steps": 1203, "loss": 0.7682, "lr": 5e-06, "epoch": 1.2951432129514322, "percentage": 43.23, "elapsed_time": "8:27:27", "remaining_time": "11:06:31"}
{"current_steps": 530, "total_steps": 1203, "loss": 0.7712, "lr": 5e-06, "epoch": 1.320049813200498, "percentage": 44.06, "elapsed_time": "8:37:03", "remaining_time": "10:56:34"}
{"current_steps": 540, "total_steps": 1203, "loss": 0.7664, "lr": 5e-06, "epoch": 1.3449564134495642, "percentage": 44.89, "elapsed_time": "8:46:40", "remaining_time": "10:46:38"}
{"current_steps": 550, "total_steps": 1203, "loss": 0.7679, "lr": 5e-06, "epoch": 1.36986301369863, "percentage": 45.72, "elapsed_time": "8:56:16", "remaining_time": "10:36:42"}
{"current_steps": 560, "total_steps": 1203, "loss": 0.7639, "lr": 5e-06, "epoch": 1.3947696139476962, "percentage": 46.55, "elapsed_time": "9:05:52", "remaining_time": "10:26:47"}
{"current_steps": 570, "total_steps": 1203, "loss": 0.7677, "lr": 5e-06, "epoch": 1.419676214196762, "percentage": 47.38, "elapsed_time": "9:15:28", "remaining_time": "10:16:52"}
{"current_steps": 580, "total_steps": 1203, "loss": 0.7626, "lr": 5e-06, "epoch": 1.4445828144458281, "percentage": 48.21, "elapsed_time": "9:25:05", "remaining_time": "10:06:58"}
{"current_steps": 590, "total_steps": 1203, "loss": 0.7639, "lr": 5e-06, "epoch": 1.4694894146948942, "percentage": 49.04, "elapsed_time": "9:34:41", "remaining_time": "9:57:05"}
{"current_steps": 600, "total_steps": 1203, "loss": 0.7612, "lr": 5e-06, "epoch": 1.4943960149439601, "percentage": 49.88, "elapsed_time": "9:44:17", "remaining_time": "9:47:12"}
{"current_steps": 610, "total_steps": 1203, "loss": 0.7685, "lr": 5e-06, "epoch": 1.519302615193026, "percentage": 50.71, "elapsed_time": "9:53:53", "remaining_time": "9:37:20"}
{"current_steps": 620, "total_steps": 1203, "loss": 0.7655, "lr": 5e-06, "epoch": 1.544209215442092, "percentage": 51.54, "elapsed_time": "10:03:30", "remaining_time": "9:27:29"}
{"current_steps": 630, "total_steps": 1203, "loss": 0.7646, "lr": 5e-06, "epoch": 1.5691158156911582, "percentage": 52.37, "elapsed_time": "10:13:06", "remaining_time": "9:17:38"}
{"current_steps": 640, "total_steps": 1203, "loss": 0.7633, "lr": 5e-06, "epoch": 1.5940224159402243, "percentage": 53.2, "elapsed_time": "10:22:42", "remaining_time": "9:07:47"}
{"current_steps": 650, "total_steps": 1203, "loss": 0.7701, "lr": 5e-06, "epoch": 1.6189290161892902, "percentage": 54.03, "elapsed_time": "10:32:17", "remaining_time": "8:57:56"}
{"current_steps": 660, "total_steps": 1203, "loss": 0.7671, "lr": 5e-06, "epoch": 1.643835616438356, "percentage": 54.86, "elapsed_time": "10:41:52", "remaining_time": "8:48:05"}
{"current_steps": 670, "total_steps": 1203, "loss": 0.7627, "lr": 5e-06, "epoch": 1.6687422166874222, "percentage": 55.69, "elapsed_time": "10:51:27", "remaining_time": "8:38:14"}
{"current_steps": 680, "total_steps": 1203, "loss": 0.7665, "lr": 5e-06, "epoch": 1.6936488169364883, "percentage": 56.53, "elapsed_time": "11:01:03", "remaining_time": "8:28:25"}
{"current_steps": 690, "total_steps": 1203, "loss": 0.7612, "lr": 5e-06, "epoch": 1.7185554171855542, "percentage": 57.36, "elapsed_time": "11:10:37", "remaining_time": "8:18:35"}
{"current_steps": 700, "total_steps": 1203, "loss": 0.7625, "lr": 5e-06, "epoch": 1.74346201743462, "percentage": 58.19, "elapsed_time": "11:20:12", "remaining_time": "8:08:46"}
{"current_steps": 710, "total_steps": 1203, "loss": 0.7678, "lr": 5e-06, "epoch": 1.7683686176836861, "percentage": 59.02, "elapsed_time": "11:29:49", "remaining_time": "7:58:59"}
{"current_steps": 720, "total_steps": 1203, "loss": 0.7641, "lr": 5e-06, "epoch": 1.7932752179327522, "percentage": 59.85, "elapsed_time": "11:39:25", "remaining_time": "7:49:12"}
{"current_steps": 730, "total_steps": 1203, "loss": 0.7671, "lr": 5e-06, "epoch": 1.8181818181818183, "percentage": 60.68, "elapsed_time": "11:49:00", "remaining_time": "7:39:24"}
{"current_steps": 740, "total_steps": 1203, "loss": 0.7569, "lr": 5e-06, "epoch": 1.8430884184308842, "percentage": 61.51, "elapsed_time": "11:58:36", "remaining_time": "7:29:36"}
{"current_steps": 750, "total_steps": 1203, "loss": 0.7617, "lr": 5e-06, "epoch": 1.86799501867995, "percentage": 62.34, "elapsed_time": "12:08:12", "remaining_time": "7:19:50"}
{"current_steps": 760, "total_steps": 1203, "loss": 0.7628, "lr": 5e-06, "epoch": 1.8929016189290162, "percentage": 63.18, "elapsed_time": "12:17:47", "remaining_time": "7:10:03"}
{"current_steps": 770, "total_steps": 1203, "loss": 0.7623, "lr": 5e-06, "epoch": 1.9178082191780823, "percentage": 64.01, "elapsed_time": "12:27:22", "remaining_time": "7:00:16"}
{"current_steps": 780, "total_steps": 1203, "loss": 0.7595, "lr": 5e-06, "epoch": 1.9427148194271482, "percentage": 64.84, "elapsed_time": "12:36:57", "remaining_time": "6:50:30"}
{"current_steps": 790, "total_steps": 1203, "loss": 0.7613, "lr": 5e-06, "epoch": 1.967621419676214, "percentage": 65.67, "elapsed_time": "12:46:33", "remaining_time": "6:40:44"}
{"current_steps": 800, "total_steps": 1203, "loss": 0.7613, "lr": 5e-06, "epoch": 1.9925280199252802, "percentage": 66.5, "elapsed_time": "12:56:09", "remaining_time": "6:30:59"}
{"current_steps": 803, "total_steps": 1203, "eval_loss": 0.798328697681427, "epoch": 2.0, "percentage": 66.75, "elapsed_time": "13:06:05", "remaining_time": "6:31:34"}
{"current_steps": 810, "total_steps": 1203, "loss": 0.764, "lr": 5e-06, "epoch": 2.0174346201743463, "percentage": 67.33, "elapsed_time": "13:14:02", "remaining_time": "6:25:15"}
{"current_steps": 820, "total_steps": 1203, "loss": 0.7174, "lr": 5e-06, "epoch": 2.0423412204234124, "percentage": 68.16, "elapsed_time": "13:23:40", "remaining_time": "6:15:22"}
{"current_steps": 830, "total_steps": 1203, "loss": 0.7136, "lr": 5e-06, "epoch": 2.067247820672478, "percentage": 68.99, "elapsed_time": "13:33:18", "remaining_time": "6:05:29"}
{"current_steps": 840, "total_steps": 1203, "loss": 0.7141, "lr": 5e-06, "epoch": 2.092154420921544, "percentage": 69.83, "elapsed_time": "13:42:57", "remaining_time": "5:55:38"}
{"current_steps": 850, "total_steps": 1203, "loss": 0.7205, "lr": 5e-06, "epoch": 2.1170610211706102, "percentage": 70.66, "elapsed_time": "13:52:35", "remaining_time": "5:45:46"}
{"current_steps": 860, "total_steps": 1203, "loss": 0.7182, "lr": 5e-06, "epoch": 2.1419676214196763, "percentage": 71.49, "elapsed_time": "14:02:13", "remaining_time": "5:35:54"}
{"current_steps": 870, "total_steps": 1203, "loss": 0.7174, "lr": 5e-06, "epoch": 2.166874221668742, "percentage": 72.32, "elapsed_time": "14:11:50", "remaining_time": "5:26:03"}
{"current_steps": 880, "total_steps": 1203, "loss": 0.7227, "lr": 5e-06, "epoch": 2.191780821917808, "percentage": 73.15, "elapsed_time": "14:21:27", "remaining_time": "5:16:11"}
{"current_steps": 890, "total_steps": 1203, "loss": 0.7154, "lr": 5e-06, "epoch": 2.216687422166874, "percentage": 73.98, "elapsed_time": "14:31:05", "remaining_time": "5:06:20"}
{"current_steps": 900, "total_steps": 1203, "loss": 0.7181, "lr": 5e-06, "epoch": 2.2415940224159403, "percentage": 74.81, "elapsed_time": "14:40:41", "remaining_time": "4:56:29"}
{"current_steps": 910, "total_steps": 1203, "loss": 0.7188, "lr": 5e-06, "epoch": 2.2665006226650064, "percentage": 75.64, "elapsed_time": "14:50:18", "remaining_time": "4:46:39"}
{"current_steps": 920, "total_steps": 1203, "loss": 0.7189, "lr": 5e-06, "epoch": 2.291407222914072, "percentage": 76.48, "elapsed_time": "14:59:56", "remaining_time": "4:36:49"}
{"current_steps": 930, "total_steps": 1203, "loss": 0.7208, "lr": 5e-06, "epoch": 2.316313823163138, "percentage": 77.31, "elapsed_time": "15:09:33", "remaining_time": "4:26:59"}
{"current_steps": 940, "total_steps": 1203, "loss": 0.7191, "lr": 5e-06, "epoch": 2.3412204234122043, "percentage": 78.14, "elapsed_time": "15:19:10", "remaining_time": "4:17:10"}
{"current_steps": 950, "total_steps": 1203, "loss": 0.7254, "lr": 5e-06, "epoch": 2.3661270236612704, "percentage": 78.97, "elapsed_time": "15:28:47", "remaining_time": "4:07:21"}
{"current_steps": 960, "total_steps": 1203, "loss": 0.7177, "lr": 5e-06, "epoch": 2.391033623910336, "percentage": 79.8, "elapsed_time": "15:38:25", "remaining_time": "3:57:32"}
{"current_steps": 970, "total_steps": 1203, "loss": 0.7162, "lr": 5e-06, "epoch": 2.415940224159402, "percentage": 80.63, "elapsed_time": "15:48:02", "remaining_time": "3:47:43"}
{"current_steps": 980, "total_steps": 1203, "loss": 0.7238, "lr": 5e-06, "epoch": 2.4408468244084682, "percentage": 81.46, "elapsed_time": "15:57:40", "remaining_time": "3:37:55"}
{"current_steps": 990, "total_steps": 1203, "loss": 0.7217, "lr": 5e-06, "epoch": 2.4657534246575343, "percentage": 82.29, "elapsed_time": "16:07:17", "remaining_time": "3:28:06"}
{"current_steps": 1000, "total_steps": 1203, "loss": 0.7211, "lr": 5e-06, "epoch": 2.4906600249066004, "percentage": 83.13, "elapsed_time": "16:16:55", "remaining_time": "3:18:18"}
{"current_steps": 1010, "total_steps": 1203, "loss": 0.722, "lr": 5e-06, "epoch": 2.515566625155666, "percentage": 83.96, "elapsed_time": "16:26:33", "remaining_time": "3:08:31"}
{"current_steps": 1020, "total_steps": 1203, "loss": 0.7226, "lr": 5e-06, "epoch": 2.540473225404732, "percentage": 84.79, "elapsed_time": "16:36:10", "remaining_time": "2:58:43"}
{"current_steps": 1030, "total_steps": 1203, "loss": 0.7201, "lr": 5e-06, "epoch": 2.5653798256537983, "percentage": 85.62, "elapsed_time": "16:45:47", "remaining_time": "2:48:56"}
{"current_steps": 1040, "total_steps": 1203, "loss": 0.7225, "lr": 5e-06, "epoch": 2.5902864259028644, "percentage": 86.45, "elapsed_time": "16:55:25", "remaining_time": "2:39:08"}
{"current_steps": 1050, "total_steps": 1203, "loss": 0.7184, "lr": 5e-06, "epoch": 2.61519302615193, "percentage": 87.28, "elapsed_time": "17:05:03", "remaining_time": "2:29:21"}
{"current_steps": 1060, "total_steps": 1203, "loss": 0.7228, "lr": 5e-06, "epoch": 2.640099626400996, "percentage": 88.11, "elapsed_time": "17:14:41", "remaining_time": "2:19:35"}
{"current_steps": 1070, "total_steps": 1203, "loss": 0.7219, "lr": 5e-06, "epoch": 2.6650062266500623, "percentage": 88.94, "elapsed_time": "17:24:19", "remaining_time": "2:09:48"}
{"current_steps": 1080, "total_steps": 1203, "loss": 0.7231, "lr": 5e-06, "epoch": 2.6899128268991284, "percentage": 89.78, "elapsed_time": "17:33:57", "remaining_time": "2:00:01"}
{"current_steps": 1090, "total_steps": 1203, "loss": 0.7207, "lr": 5e-06, "epoch": 2.7148194271481945, "percentage": 90.61, "elapsed_time": "17:43:34", "remaining_time": "1:50:15"}
{"current_steps": 1100, "total_steps": 1203, "loss": 0.7225, "lr": 5e-06, "epoch": 2.73972602739726, "percentage": 91.44, "elapsed_time": "17:53:11", "remaining_time": "1:40:29"}
{"current_steps": 1110, "total_steps": 1203, "loss": 0.7199, "lr": 5e-06, "epoch": 2.7646326276463262, "percentage": 92.27, "elapsed_time": "18:02:48", "remaining_time": "1:30:43"}
{"current_steps": 1120, "total_steps": 1203, "loss": 0.723, "lr": 5e-06, "epoch": 2.7895392278953923, "percentage": 93.1, "elapsed_time": "18:12:25", "remaining_time": "1:20:57"}
{"current_steps": 1130, "total_steps": 1203, "loss": 0.7195, "lr": 5e-06, "epoch": 2.8144458281444584, "percentage": 93.93, "elapsed_time": "18:22:02", "remaining_time": "1:11:11"}
{"current_steps": 1140, "total_steps": 1203, "loss": 0.7241, "lr": 5e-06, "epoch": 2.839352428393524, "percentage": 94.76, "elapsed_time": "18:31:40", "remaining_time": "1:01:26"}
{"current_steps": 1150, "total_steps": 1203, "loss": 0.7218, "lr": 5e-06, "epoch": 2.86425902864259, "percentage": 95.59, "elapsed_time": "18:41:17", "remaining_time": "0:51:40"}
{"current_steps": 1160, "total_steps": 1203, "loss": 0.7223, "lr": 5e-06, "epoch": 2.8891656288916563, "percentage": 96.43, "elapsed_time": "18:50:54", "remaining_time": "0:41:55"}
{"current_steps": 1170, "total_steps": 1203, "loss": 0.7248, "lr": 5e-06, "epoch": 2.9140722291407224, "percentage": 97.26, "elapsed_time": "19:00:31", "remaining_time": "0:32:10"}
{"current_steps": 1180, "total_steps": 1203, "loss": 0.7186, "lr": 5e-06, "epoch": 2.9389788293897885, "percentage": 98.09, "elapsed_time": "19:10:08", "remaining_time": "0:22:25"}
{"current_steps": 1190, "total_steps": 1203, "loss": 0.7225, "lr": 5e-06, "epoch": 2.963885429638854, "percentage": 98.92, "elapsed_time": "19:19:43", "remaining_time": "0:12:40"}
{"current_steps": 1200, "total_steps": 1203, "loss": 0.7228, "lr": 5e-06, "epoch": 2.9887920298879203, "percentage": 99.75, "elapsed_time": "19:29:22", "remaining_time": "0:02:55"}
{"current_steps": 1203, "total_steps": 1203, "eval_loss": 0.7962795495986938, "epoch": 2.99626400996264, "percentage": 100.0, "elapsed_time": "19:40:42", "remaining_time": "0:00:00"}
{"current_steps": 1203, "total_steps": 1203, "epoch": 2.99626400996264, "percentage": 100.0, "elapsed_time": "19:42:13", "remaining_time": "0:00:00"}