{"current_steps": 5, "total_steps": 40000, "loss": 3.6004, "lr": 0.29999999259779675, "epoch": 0.00024430166369432974, "percentage": 0.01, "elapsed_time": "0:00:04", "remaining_time": "10:59:38", "throughput": 1267.59, "total_tokens": 6272} {"current_steps": 10, "total_steps": 40000, "loss": 0.5392, "lr": 0.29999996252634736, "epoch": 0.0004886033273886595, "percentage": 0.03, "elapsed_time": "0:00:08", "remaining_time": "8:59:04", "throughput": 1606.28, "total_tokens": 12992} {"current_steps": 15, "total_steps": 40000, "loss": 0.2136, "lr": 0.2999999093230187, "epoch": 0.0007329049910829893, "percentage": 0.04, "elapsed_time": "0:00:11", "remaining_time": "8:18:28", "throughput": 1745.49, "total_tokens": 19584} {"current_steps": 20, "total_steps": 40000, "loss": 0.1897, "lr": 0.299999832987819, "epoch": 0.000977206654777319, "percentage": 0.05, "elapsed_time": "0:00:14", "remaining_time": "7:58:10", "throughput": 1826.05, "total_tokens": 26208} {"current_steps": 25, "total_steps": 40000, "loss": 0.1866, "lr": 0.29999973352076004, "epoch": 0.0012215083184716488, "percentage": 0.06, "elapsed_time": "0:00:17", "remaining_time": "7:42:33", "throughput": 1865.79, "total_tokens": 32384} {"current_steps": 30, "total_steps": 40000, "loss": 0.1684, "lr": 0.2999996109218572, "epoch": 0.0014658099821659785, "percentage": 0.07, "elapsed_time": "0:00:20", "remaining_time": "7:31:55", "throughput": 1886.79, "total_tokens": 38400} {"current_steps": 35, "total_steps": 40000, "loss": 0.1906, "lr": 0.2999994651911293, "epoch": 0.0017101116458603082, "percentage": 0.09, "elapsed_time": "0:00:23", "remaining_time": "7:24:59", "throughput": 1906.41, "total_tokens": 44576} {"current_steps": 40, "total_steps": 40000, "loss": 0.1866, "lr": 0.2999992963285989, "epoch": 0.001954413309554638, "percentage": 0.1, "elapsed_time": "0:00:26", "remaining_time": "7:20:28", "throughput": 1920.81, "total_tokens": 50816} {"current_steps": 45, "total_steps": 40000, "loss": 0.1901, "lr": 0.29999910433429194, "epoch": 0.002198714973248968, "percentage": 0.11, "elapsed_time": "0:00:29", "remaining_time": "7:16:14", "throughput": 1930.02, "total_tokens": 56896} {"current_steps": 50, "total_steps": 40000, "loss": 0.1818, "lr": 0.29999888920823814, "epoch": 0.0024430166369432977, "percentage": 0.12, "elapsed_time": "0:00:32", "remaining_time": "7:12:29", "throughput": 1939.04, "total_tokens": 62976} {"current_steps": 55, "total_steps": 40000, "loss": 0.1841, "lr": 0.29999865095047057, "epoch": 0.0026873183006376274, "percentage": 0.14, "elapsed_time": "0:00:35", "remaining_time": "7:12:06", "throughput": 1959.58, "total_tokens": 69952} {"current_steps": 60, "total_steps": 40000, "loss": 0.2057, "lr": 0.29999838956102604, "epoch": 0.002931619964331957, "percentage": 0.15, "elapsed_time": "0:00:38", "remaining_time": "7:11:04", "throughput": 1969.98, "total_tokens": 76544} {"current_steps": 65, "total_steps": 40000, "loss": 0.2032, "lr": 0.29999810503994484, "epoch": 0.0031759216280262867, "percentage": 0.16, "elapsed_time": "0:00:41", "remaining_time": "7:09:27", "throughput": 1973.86, "total_tokens": 82784} {"current_steps": 70, "total_steps": 40000, "loss": 0.1567, "lr": 0.29999779738727084, "epoch": 0.0034202232917206164, "percentage": 0.18, "elapsed_time": "0:00:45", "remaining_time": "7:08:30", "throughput": 1979.43, "total_tokens": 89216} {"current_steps": 75, "total_steps": 40000, "loss": 0.161, "lr": 0.29999746660305154, "epoch": 0.0036645249554149465, "percentage": 0.19, "elapsed_time": "0:00:48", "remaining_time": "7:07:48", "throughput": 1988.23, "total_tokens": 95872} {"current_steps": 80, "total_steps": 40000, "loss": 0.1642, "lr": 0.2999971126873379, "epoch": 0.003908826619109276, "percentage": 0.2, "elapsed_time": "0:00:51", "remaining_time": "7:06:21", "throughput": 1990.6, "total_tokens": 102048} {"current_steps": 85, "total_steps": 40000, "loss": 0.1645, "lr": 0.2999967356401845, "epoch": 0.004153128282803606, "percentage": 0.21, "elapsed_time": "0:00:54", "remaining_time": "7:05:14", "throughput": 1994.81, "total_tokens": 108384} {"current_steps": 90, "total_steps": 40000, "loss": 0.1989, "lr": 0.29999633546164944, "epoch": 0.004397429946497936, "percentage": 0.22, "elapsed_time": "0:00:57", "remaining_time": "7:04:03", "throughput": 1995.5, "total_tokens": 114496} {"current_steps": 95, "total_steps": 40000, "loss": 0.1727, "lr": 0.29999591215179444, "epoch": 0.004641731610192265, "percentage": 0.24, "elapsed_time": "0:01:00", "remaining_time": "7:03:35", "throughput": 1996.52, "total_tokens": 120800} {"current_steps": 100, "total_steps": 40000, "loss": 0.1774, "lr": 0.2999954657106849, "epoch": 0.004886033273886595, "percentage": 0.25, "elapsed_time": "0:01:03", "remaining_time": "7:02:22", "throughput": 1996.66, "total_tokens": 126816} {"current_steps": 105, "total_steps": 40000, "loss": 0.1498, "lr": 0.2999949961383896, "epoch": 0.005130334937580925, "percentage": 0.26, "elapsed_time": "0:01:06", "remaining_time": "7:02:11", "throughput": 2003.41, "total_tokens": 133568} {"current_steps": 110, "total_steps": 40000, "loss": 0.1772, "lr": 0.2999945034349809, "epoch": 0.005374636601275255, "percentage": 0.27, "elapsed_time": "0:01:09", "remaining_time": "7:01:43", "throughput": 2009.62, "total_tokens": 140224} {"current_steps": 115, "total_steps": 40000, "loss": 0.1642, "lr": 0.2999939876005348, "epoch": 0.005618938264969585, "percentage": 0.29, "elapsed_time": "0:01:12", "remaining_time": "7:01:02", "throughput": 2013.42, "total_tokens": 146656} {"current_steps": 120, "total_steps": 40000, "loss": 0.1588, "lr": 0.29999344863513094, "epoch": 0.005863239928663914, "percentage": 0.3, "elapsed_time": "0:01:15", "remaining_time": "7:00:56", "throughput": 2020.72, "total_tokens": 153568} {"current_steps": 125, "total_steps": 40000, "loss": 0.1701, "lr": 0.2999928865388523, "epoch": 0.006107541592358244, "percentage": 0.31, "elapsed_time": "0:01:19", "remaining_time": "7:00:24", "throughput": 2023.04, "total_tokens": 159968} {"current_steps": 130, "total_steps": 40000, "loss": 0.1571, "lr": 0.29999230131178567, "epoch": 0.0063518432560525735, "percentage": 0.33, "elapsed_time": "0:01:22", "remaining_time": "6:59:46", "throughput": 2024.26, "total_tokens": 166240} {"current_steps": 135, "total_steps": 40000, "loss": 0.1684, "lr": 0.2999916929540212, "epoch": 0.006596144919746904, "percentage": 0.34, "elapsed_time": "0:01:25", "remaining_time": "6:59:33", "throughput": 2025.52, "total_tokens": 172672} {"current_steps": 140, "total_steps": 40000, "loss": 0.1937, "lr": 0.29999106146565285, "epoch": 0.006840446583441233, "percentage": 0.35, "elapsed_time": "0:01:28", "remaining_time": "6:58:29", "throughput": 2023.24, "total_tokens": 178432} {"current_steps": 145, "total_steps": 40000, "loss": 0.1481, "lr": 0.29999040684677786, "epoch": 0.007084748247135563, "percentage": 0.36, "elapsed_time": "0:01:31", "remaining_time": "6:57:53", "throughput": 2024.05, "total_tokens": 184640} {"current_steps": 150, "total_steps": 40000, "loss": 0.1524, "lr": 0.2999897290974972, "epoch": 0.007329049910829893, "percentage": 0.38, "elapsed_time": "0:01:34", "remaining_time": "6:57:40", "throughput": 2025.2, "total_tokens": 191040} {"current_steps": 155, "total_steps": 40000, "loss": 0.17, "lr": 0.2999890282179155, "epoch": 0.007573351574524222, "percentage": 0.39, "elapsed_time": "0:01:37", "remaining_time": "6:57:14", "throughput": 2026.73, "total_tokens": 197376} {"current_steps": 160, "total_steps": 40000, "loss": 0.1457, "lr": 0.29998830420814077, "epoch": 0.007817653238218552, "percentage": 0.4, "elapsed_time": "0:01:40", "remaining_time": "6:57:51", "throughput": 2032.39, "total_tokens": 204640} {"current_steps": 165, "total_steps": 40000, "loss": 0.1602, "lr": 0.2999875570682846, "epoch": 0.008061954901912883, "percentage": 0.41, "elapsed_time": "0:01:43", "remaining_time": "6:57:22", "throughput": 2033.02, "total_tokens": 210880} {"current_steps": 170, "total_steps": 40000, "loss": 0.1372, "lr": 0.2999867867984623, "epoch": 0.008306256565607212, "percentage": 0.43, "elapsed_time": "0:01:46", "remaining_time": "6:57:11", "throughput": 2035.54, "total_tokens": 217472} {"current_steps": 175, "total_steps": 40000, "loss": 0.1653, "lr": 0.29998599339879267, "epoch": 0.008550558229301541, "percentage": 0.44, "elapsed_time": "0:01:49", "remaining_time": "6:56:56", "throughput": 2037.43, "total_tokens": 223968} {"current_steps": 180, "total_steps": 40000, "loss": 0.1519, "lr": 0.29998517686939796, "epoch": 0.008794859892995872, "percentage": 0.45, "elapsed_time": "0:01:52", "remaining_time": "6:56:36", "throughput": 2038.51, "total_tokens": 230336} {"current_steps": 185, "total_steps": 40000, "loss": 0.1735, "lr": 0.29998433721040413, "epoch": 0.009039161556690201, "percentage": 0.46, "elapsed_time": "0:01:56", "remaining_time": "6:56:18", "throughput": 2038.87, "total_tokens": 236640} {"current_steps": 190, "total_steps": 40000, "loss": 0.1881, "lr": 0.29998347442194073, "epoch": 0.00928346322038453, "percentage": 0.47, "elapsed_time": "0:01:59", "remaining_time": "6:55:44", "throughput": 2037.98, "total_tokens": 242624} {"current_steps": 195, "total_steps": 40000, "loss": 0.1541, "lr": 0.2999825885041407, "epoch": 0.00952776488407886, "percentage": 0.49, "elapsed_time": "0:02:02", "remaining_time": "6:55:23", "throughput": 2039.02, "total_tokens": 248960} {"current_steps": 200, "total_steps": 40000, "loss": 0.2032, "lr": 0.29998167945714077, "epoch": 0.00977206654777319, "percentage": 0.5, "elapsed_time": "0:02:05", "remaining_time": "6:54:56", "throughput": 2037.75, "total_tokens": 254944} {"current_steps": 200, "total_steps": 40000, "eval_loss": 0.19676335155963898, "epoch": 0.00977206654777319, "percentage": 0.5, "elapsed_time": "0:12:43", "remaining_time": "1 day, 18:10:47", "throughput": 334.11, "total_tokens": 254944} {"current_steps": 205, "total_steps": 40000, "loss": 0.1893, "lr": 0.2999807472810811, "epoch": 0.01001636821146752, "percentage": 0.51, "elapsed_time": "0:12:47", "remaining_time": "1 day, 17:21:54", "throughput": 340.56, "total_tokens": 261248} {"current_steps": 210, "total_steps": 40000, "loss": 0.1975, "lr": 0.29997979197610536, "epoch": 0.01026066987516185, "percentage": 0.53, "elapsed_time": "0:12:50", "remaining_time": "1 day, 16:31:56", "throughput": 347.05, "total_tokens": 267264} {"current_steps": 215, "total_steps": 40000, "loss": 0.1838, "lr": 0.299978813542361, "epoch": 0.01050497153885618, "percentage": 0.54, "elapsed_time": "0:12:53", "remaining_time": "1 day, 15:44:39", "throughput": 354.14, "total_tokens": 273824} {"current_steps": 220, "total_steps": 40000, "loss": 0.1911, "lr": 0.2999778119799988, "epoch": 0.01074927320255051, "percentage": 0.55, "elapsed_time": "0:12:56", "remaining_time": "1 day, 14:59:36", "throughput": 361.41, "total_tokens": 280576} {"current_steps": 225, "total_steps": 40000, "loss": 0.157, "lr": 0.29997678728917326, "epoch": 0.010993574866244839, "percentage": 0.56, "elapsed_time": "0:12:59", "remaining_time": "1 day, 14:16:23", "throughput": 367.86, "total_tokens": 286720} {"current_steps": 230, "total_steps": 40000, "loss": 0.1402, "lr": 0.2999757394700424, "epoch": 0.01123787652993917, "percentage": 0.57, "elapsed_time": "0:13:02", "remaining_time": "1 day, 13:35:02", "throughput": 374.56, "total_tokens": 293088} {"current_steps": 235, "total_steps": 40000, "loss": 0.1702, "lr": 0.29997466852276783, "epoch": 0.011482178193633499, "percentage": 0.59, "elapsed_time": "0:13:05", "remaining_time": "1 day, 12:55:25", "throughput": 381.16, "total_tokens": 299424} {"current_steps": 240, "total_steps": 40000, "loss": 0.1787, "lr": 0.29997357444751466, "epoch": 0.011726479857327828, "percentage": 0.6, "elapsed_time": "0:13:08", "remaining_time": "1 day, 12:17:37", "throughput": 387.97, "total_tokens": 305984} {"current_steps": 245, "total_steps": 40000, "loss": 0.173, "lr": 0.2999724572444516, "epoch": 0.011970781521022157, "percentage": 0.61, "elapsed_time": "0:13:11", "remaining_time": "1 day, 11:41:24", "throughput": 394.35, "total_tokens": 312256} {"current_steps": 250, "total_steps": 40000, "loss": 0.1599, "lr": 0.29997131691375095, "epoch": 0.012215083184716488, "percentage": 0.62, "elapsed_time": "0:13:14", "remaining_time": "1 day, 11:06:43", "throughput": 400.91, "total_tokens": 318720} {"current_steps": 255, "total_steps": 40000, "loss": 0.1378, "lr": 0.2999701534555886, "epoch": 0.012459384848410818, "percentage": 0.64, "elapsed_time": "0:13:18", "remaining_time": "1 day, 10:33:07", "throughput": 406.99, "total_tokens": 324800} {"current_steps": 260, "total_steps": 40000, "loss": 0.1661, "lr": 0.2999689668701439, "epoch": 0.012703686512105147, "percentage": 0.65, "elapsed_time": "0:13:21", "remaining_time": "1 day, 10:00:44", "throughput": 413.12, "total_tokens": 330944} {"current_steps": 265, "total_steps": 40000, "loss": 0.1688, "lr": 0.29996775715759993, "epoch": 0.012947988175799478, "percentage": 0.66, "elapsed_time": "0:13:24", "remaining_time": "1 day, 9:29:46", "throughput": 419.39, "total_tokens": 337280} {"current_steps": 270, "total_steps": 40000, "loss": 0.1489, "lr": 0.2999665243181432, "epoch": 0.013192289839493807, "percentage": 0.68, "elapsed_time": "0:13:27", "remaining_time": "1 day, 8:59:52", "throughput": 425.56, "total_tokens": 343552} {"current_steps": 275, "total_steps": 40000, "loss": 0.1882, "lr": 0.2999652683519638, "epoch": 0.013436591503188136, "percentage": 0.69, "elapsed_time": "0:13:30", "remaining_time": "1 day, 8:31:19", "throughput": 432.21, "total_tokens": 350304} {"current_steps": 280, "total_steps": 40000, "loss": 0.1733, "lr": 0.29996398925925544, "epoch": 0.013680893166882466, "percentage": 0.7, "elapsed_time": "0:13:33", "remaining_time": "1 day, 8:03:34", "throughput": 438.62, "total_tokens": 356864} {"current_steps": 285, "total_steps": 40000, "loss": 0.1574, "lr": 0.2999626870402154, "epoch": 0.013925194830576797, "percentage": 0.71, "elapsed_time": "0:13:36", "remaining_time": "1 day, 7:36:53", "throughput": 444.89, "total_tokens": 363360} {"current_steps": 290, "total_steps": 40000, "loss": 0.1558, "lr": 0.29996136169504445, "epoch": 0.014169496494271126, "percentage": 0.73, "elapsed_time": "0:13:39", "remaining_time": "1 day, 7:10:54", "throughput": 450.92, "total_tokens": 369664} {"current_steps": 295, "total_steps": 40000, "loss": 0.136, "lr": 0.29996001322394694, "epoch": 0.014413798157965455, "percentage": 0.74, "elapsed_time": "0:13:42", "remaining_time": "1 day, 6:45:41", "throughput": 456.59, "total_tokens": 375680} {"current_steps": 300, "total_steps": 40000, "loss": 0.2029, "lr": 0.29995864162713093, "epoch": 0.014658099821659786, "percentage": 0.75, "elapsed_time": "0:13:45", "remaining_time": "1 day, 6:21:28", "throughput": 462.37, "total_tokens": 381856} {"current_steps": 305, "total_steps": 40000, "loss": 0.1512, "lr": 0.2999572469048079, "epoch": 0.014902401485354115, "percentage": 0.76, "elapsed_time": "0:13:48", "remaining_time": "1 day, 5:57:56", "throughput": 467.99, "total_tokens": 387904} {"current_steps": 310, "total_steps": 40000, "loss": 0.1587, "lr": 0.29995582905719287, "epoch": 0.015146703149048445, "percentage": 0.78, "elapsed_time": "0:13:52", "remaining_time": "1 day, 5:35:23", "throughput": 474.0, "total_tokens": 394368} {"current_steps": 315, "total_steps": 40000, "loss": 0.1662, "lr": 0.2999543880845046, "epoch": 0.015391004812742774, "percentage": 0.79, "elapsed_time": "0:13:55", "remaining_time": "1 day, 5:13:23", "throughput": 479.66, "total_tokens": 400544} {"current_steps": 320, "total_steps": 40000, "loss": 0.1631, "lr": 0.2999529239869652, "epoch": 0.015635306476437103, "percentage": 0.8, "elapsed_time": "0:13:58", "remaining_time": "1 day, 4:52:05", "throughput": 485.67, "total_tokens": 407040} {"current_steps": 325, "total_steps": 40000, "loss": 0.1742, "lr": 0.2999514367648005, "epoch": 0.015879608140131434, "percentage": 0.81, "elapsed_time": "0:14:01", "remaining_time": "1 day, 4:31:31", "throughput": 491.07, "total_tokens": 413088} {"current_steps": 330, "total_steps": 40000, "loss": 0.1977, "lr": 0.29994992641823987, "epoch": 0.016123909803825765, "percentage": 0.83, "elapsed_time": "0:14:04", "remaining_time": "1 day, 4:11:43", "throughput": 497.18, "total_tokens": 419808} {"current_steps": 335, "total_steps": 40000, "loss": 0.1847, "lr": 0.29994839294751613, "epoch": 0.016368211467520093, "percentage": 0.84, "elapsed_time": "0:14:07", "remaining_time": "1 day, 3:52:20", "throughput": 502.59, "total_tokens": 425920} {"current_steps": 340, "total_steps": 40000, "loss": 0.1491, "lr": 0.29994683635286584, "epoch": 0.016612513131214424, "percentage": 0.85, "elapsed_time": "0:14:10", "remaining_time": "1 day, 3:33:30", "throughput": 508.37, "total_tokens": 432384} {"current_steps": 345, "total_steps": 40000, "loss": 0.1728, "lr": 0.2999452566345291, "epoch": 0.016856814794908755, "percentage": 0.86, "elapsed_time": "0:14:13", "remaining_time": "1 day, 3:15:20", "throughput": 514.27, "total_tokens": 439008} {"current_steps": 350, "total_steps": 40000, "loss": 0.1641, "lr": 0.2999436537927494, "epoch": 0.017101116458603082, "percentage": 0.88, "elapsed_time": "0:14:16", "remaining_time": "1 day, 2:57:27", "throughput": 519.38, "total_tokens": 444928} {"current_steps": 355, "total_steps": 40000, "loss": 0.1379, "lr": 0.299942027827774, "epoch": 0.017345418122297413, "percentage": 0.89, "elapsed_time": "0:14:19", "remaining_time": "1 day, 2:40:15", "throughput": 524.94, "total_tokens": 451328} {"current_steps": 360, "total_steps": 40000, "loss": 0.1416, "lr": 0.29994037873985363, "epoch": 0.017589719785991744, "percentage": 0.9, "elapsed_time": "0:14:22", "remaining_time": "1 day, 2:23:26", "throughput": 530.31, "total_tokens": 457568} {"current_steps": 365, "total_steps": 40000, "loss": 0.1665, "lr": 0.29993870652924254, "epoch": 0.01783402144968607, "percentage": 0.91, "elapsed_time": "0:14:25", "remaining_time": "1 day, 2:06:57", "throughput": 535.29, "total_tokens": 463456} {"current_steps": 370, "total_steps": 40000, "loss": 0.1688, "lr": 0.29993701119619876, "epoch": 0.018078323113380403, "percentage": 0.92, "elapsed_time": "0:14:28", "remaining_time": "1 day, 1:50:59", "throughput": 540.68, "total_tokens": 469760} {"current_steps": 375, "total_steps": 40000, "loss": 0.1522, "lr": 0.2999352927409835, "epoch": 0.018322624777074734, "percentage": 0.94, "elapsed_time": "0:14:31", "remaining_time": "1 day, 1:35:32", "throughput": 545.89, "total_tokens": 475968} {"current_steps": 380, "total_steps": 40000, "loss": 0.1384, "lr": 0.29993355116386194, "epoch": 0.01856692644076906, "percentage": 0.95, "elapsed_time": "0:14:34", "remaining_time": "1 day, 1:20:26", "throughput": 551.05, "total_tokens": 482144} {"current_steps": 385, "total_steps": 40000, "loss": 0.1617, "lr": 0.29993178646510266, "epoch": 0.018811228104463392, "percentage": 0.96, "elapsed_time": "0:14:38", "remaining_time": "1 day, 1:05:43", "throughput": 556.21, "total_tokens": 488352} {"current_steps": 390, "total_steps": 40000, "loss": 0.1331, "lr": 0.2999299986449777, "epoch": 0.01905552976815772, "percentage": 0.97, "elapsed_time": "0:14:41", "remaining_time": "1 day, 0:51:27", "throughput": 561.41, "total_tokens": 494656} {"current_steps": 395, "total_steps": 40000, "loss": 0.1529, "lr": 0.29992818770376284, "epoch": 0.01929983143185205, "percentage": 0.99, "elapsed_time": "0:14:44", "remaining_time": "1 day, 0:37:27", "throughput": 566.47, "total_tokens": 500832} {"current_steps": 400, "total_steps": 40000, "loss": 0.1317, "lr": 0.29992635364173725, "epoch": 0.01954413309554638, "percentage": 1.0, "elapsed_time": "0:14:47", "remaining_time": "1 day, 0:24:03", "throughput": 571.94, "total_tokens": 507488} {"current_steps": 400, "total_steps": 40000, "eval_loss": 0.17288938164710999, "epoch": 0.01954413309554638, "percentage": 1.0, "elapsed_time": "0:25:25", "remaining_time": "1 day, 17:57:05", "throughput": 332.67, "total_tokens": 507488} {"current_steps": 405, "total_steps": 40000, "loss": 0.1434, "lr": 0.2999244964591839, "epoch": 0.01978843475924071, "percentage": 1.01, "elapsed_time": "0:25:29", "remaining_time": "1 day, 17:31:58", "throughput": 336.5, "total_tokens": 514624} {"current_steps": 410, "total_steps": 40000, "loss": 0.166, "lr": 0.2999226161563891, "epoch": 0.02003273642293504, "percentage": 1.03, "elapsed_time": "0:25:32", "remaining_time": "1 day, 17:06:14", "throughput": 339.87, "total_tokens": 520832} {"current_steps": 415, "total_steps": 40000, "loss": 0.1758, "lr": 0.2999207127336429, "epoch": 0.02027703808662937, "percentage": 1.04, "elapsed_time": "0:25:35", "remaining_time": "1 day, 16:41:10", "throughput": 343.43, "total_tokens": 527360} {"current_steps": 420, "total_steps": 40000, "loss": 0.1148, "lr": 0.2999187861912387, "epoch": 0.0205213397503237, "percentage": 1.05, "elapsed_time": "0:25:38", "remaining_time": "1 day, 16:16:53", "throughput": 347.26, "total_tokens": 534368} {"current_steps": 425, "total_steps": 40000, "loss": 0.1442, "lr": 0.2999168365294737, "epoch": 0.02076564141401803, "percentage": 1.06, "elapsed_time": "0:25:41", "remaining_time": "1 day, 15:52:53", "throughput": 350.66, "total_tokens": 540672} {"current_steps": 430, "total_steps": 40000, "loss": 0.136, "lr": 0.29991486374864856, "epoch": 0.02100994307771236, "percentage": 1.07, "elapsed_time": "0:25:44", "remaining_time": "1 day, 15:29:27", "throughput": 353.91, "total_tokens": 546752} {"current_steps": 435, "total_steps": 40000, "loss": 0.1715, "lr": 0.29991286784906745, "epoch": 0.021254244741406688, "percentage": 1.09, "elapsed_time": "0:25:47", "remaining_time": "1 day, 15:06:29", "throughput": 357.14, "total_tokens": 552832} {"current_steps": 440, "total_steps": 40000, "loss": 0.152, "lr": 0.2999108488310382, "epoch": 0.02149854640510102, "percentage": 1.1, "elapsed_time": "0:25:50", "remaining_time": "1 day, 14:43:59", "throughput": 360.24, "total_tokens": 558688} {"current_steps": 445, "total_steps": 40000, "loss": 0.1538, "lr": 0.29990880669487213, "epoch": 0.02174284806879535, "percentage": 1.11, "elapsed_time": "0:25:53", "remaining_time": "1 day, 14:22:08", "throughput": 363.66, "total_tokens": 565120} {"current_steps": 450, "total_steps": 40000, "loss": 0.1515, "lr": 0.29990674144088425, "epoch": 0.021987149732489678, "percentage": 1.12, "elapsed_time": "0:25:57", "remaining_time": "1 day, 14:00:50", "throughput": 366.98, "total_tokens": 571424} {"current_steps": 455, "total_steps": 40000, "loss": 0.1595, "lr": 0.299904653069393, "epoch": 0.02223145139618401, "percentage": 1.14, "elapsed_time": "0:26:00", "remaining_time": "1 day, 13:40:08", "throughput": 370.72, "total_tokens": 578432} {"current_steps": 460, "total_steps": 40000, "loss": 0.1602, "lr": 0.29990254158072044, "epoch": 0.02247575305987834, "percentage": 1.15, "elapsed_time": "0:26:03", "remaining_time": "1 day, 13:19:32", "throughput": 373.74, "total_tokens": 584256} {"current_steps": 465, "total_steps": 40000, "loss": 0.1603, "lr": 0.2999004069751921, "epoch": 0.022720054723572667, "percentage": 1.16, "elapsed_time": "0:26:06", "remaining_time": "1 day, 12:59:34", "throughput": 377.07, "total_tokens": 590624} {"current_steps": 470, "total_steps": 40000, "loss": 0.1394, "lr": 0.2998982492531373, "epoch": 0.022964356387266998, "percentage": 1.18, "elapsed_time": "0:26:09", "remaining_time": "1 day, 12:39:53", "throughput": 380.26, "total_tokens": 596768} {"current_steps": 475, "total_steps": 40000, "loss": 0.1382, "lr": 0.2998960684148887, "epoch": 0.023208658050961326, "percentage": 1.19, "elapsed_time": "0:26:12", "remaining_time": "1 day, 12:20:47", "throughput": 383.62, "total_tokens": 603232} {"current_steps": 480, "total_steps": 40000, "loss": 0.1694, "lr": 0.29989386446078264, "epoch": 0.023452959714655656, "percentage": 1.2, "elapsed_time": "0:26:15", "remaining_time": "1 day, 12:01:54", "throughput": 386.58, "total_tokens": 609056} {"current_steps": 485, "total_steps": 40000, "loss": 0.1389, "lr": 0.299891637391159, "epoch": 0.023697261378349987, "percentage": 1.21, "elapsed_time": "0:26:18", "remaining_time": "1 day, 11:43:41", "throughput": 390.02, "total_tokens": 615712} {"current_steps": 490, "total_steps": 40000, "loss": 0.144, "lr": 0.2998893872063612, "epoch": 0.023941563042044315, "percentage": 1.23, "elapsed_time": "0:26:21", "remaining_time": "1 day, 11:25:44", "throughput": 393.48, "total_tokens": 622400} {"current_steps": 495, "total_steps": 40000, "loss": 0.1302, "lr": 0.2998871139067363, "epoch": 0.024185864705738646, "percentage": 1.24, "elapsed_time": "0:26:24", "remaining_time": "1 day, 11:08:04", "throughput": 396.76, "total_tokens": 628800} {"current_steps": 500, "total_steps": 40000, "loss": 0.1235, "lr": 0.2998848174926348, "epoch": 0.024430166369432977, "percentage": 1.25, "elapsed_time": "0:26:28", "remaining_time": "1 day, 10:51:00", "throughput": 400.45, "total_tokens": 635968} {"current_steps": 505, "total_steps": 40000, "loss": 0.1589, "lr": 0.2998824979644109, "epoch": 0.024674468033127304, "percentage": 1.26, "elapsed_time": "0:26:31", "remaining_time": "1 day, 10:34:12", "throughput": 403.87, "total_tokens": 642688} {"current_steps": 510, "total_steps": 40000, "loss": 0.1443, "lr": 0.29988015532242224, "epoch": 0.024918769696821635, "percentage": 1.27, "elapsed_time": "0:26:34", "remaining_time": "1 day, 10:17:32", "throughput": 406.9, "total_tokens": 648736} {"current_steps": 515, "total_steps": 40000, "loss": 0.1427, "lr": 0.29987778956703015, "epoch": 0.025163071360515966, "percentage": 1.29, "elapsed_time": "0:26:37", "remaining_time": "1 day, 10:01:28", "throughput": 410.51, "total_tokens": 655840} {"current_steps": 520, "total_steps": 40000, "loss": 0.1343, "lr": 0.2998754006985994, "epoch": 0.025407373024210294, "percentage": 1.3, "elapsed_time": "0:26:40", "remaining_time": "1 day, 9:45:38", "throughput": 414.01, "total_tokens": 662752} {"current_steps": 525, "total_steps": 40000, "loss": 0.1679, "lr": 0.29987298871749846, "epoch": 0.025651674687904625, "percentage": 1.31, "elapsed_time": "0:26:43", "remaining_time": "1 day, 9:29:56", "throughput": 417.17, "total_tokens": 669088} {"current_steps": 530, "total_steps": 40000, "loss": 0.1519, "lr": 0.2998705536240992, "epoch": 0.025895976351598956, "percentage": 1.32, "elapsed_time": "0:26:46", "remaining_time": "1 day, 9:14:30", "throughput": 420.2, "total_tokens": 675232} {"current_steps": 535, "total_steps": 40000, "loss": 0.1846, "lr": 0.2998680954187772, "epoch": 0.026140278015293283, "percentage": 1.34, "elapsed_time": "0:26:49", "remaining_time": "1 day, 8:59:20", "throughput": 423.31, "total_tokens": 681504} {"current_steps": 540, "total_steps": 40000, "loss": 0.1521, "lr": 0.2998656141019115, "epoch": 0.026384579678987614, "percentage": 1.35, "elapsed_time": "0:26:53", "remaining_time": "1 day, 8:44:31", "throughput": 426.43, "total_tokens": 687840} {"current_steps": 545, "total_steps": 40000, "loss": 0.1414, "lr": 0.2998631096738848, "epoch": 0.026628881342681942, "percentage": 1.36, "elapsed_time": "0:26:56", "remaining_time": "1 day, 8:29:58", "throughput": 429.45, "total_tokens": 694048} {"current_steps": 550, "total_steps": 40000, "loss": 0.1577, "lr": 0.29986058213508326, "epoch": 0.026873183006376273, "percentage": 1.38, "elapsed_time": "0:26:59", "remaining_time": "1 day, 8:15:38", "throughput": 432.46, "total_tokens": 700224} {"current_steps": 555, "total_steps": 40000, "loss": 0.1515, "lr": 0.29985803148589674, "epoch": 0.027117484670070604, "percentage": 1.39, "elapsed_time": "0:27:02", "remaining_time": "1 day, 8:01:36", "throughput": 435.52, "total_tokens": 706528} {"current_steps": 560, "total_steps": 40000, "loss": 0.1663, "lr": 0.2998554577267185, "epoch": 0.02736178633376493, "percentage": 1.4, "elapsed_time": "0:27:05", "remaining_time": "1 day, 7:47:47", "throughput": 438.37, "total_tokens": 712480} {"current_steps": 565, "total_steps": 40000, "loss": 0.1421, "lr": 0.2998528608579455, "epoch": 0.027606087997459262, "percentage": 1.41, "elapsed_time": "0:27:08", "remaining_time": "1 day, 7:34:15", "throughput": 441.27, "total_tokens": 718560} {"current_steps": 570, "total_steps": 40000, "loss": 0.1343, "lr": 0.2998502408799781, "epoch": 0.027850389661153593, "percentage": 1.43, "elapsed_time": "0:27:11", "remaining_time": "1 day, 7:21:00", "throughput": 444.45, "total_tokens": 725120} {"current_steps": 575, "total_steps": 40000, "loss": 0.1675, "lr": 0.2998475977932205, "epoch": 0.02809469132484792, "percentage": 1.44, "elapsed_time": "0:27:14", "remaining_time": "1 day, 7:07:55", "throughput": 447.47, "total_tokens": 731424} {"current_steps": 580, "total_steps": 40000, "loss": 0.1371, "lr": 0.29984493159808023, "epoch": 0.028338992988542252, "percentage": 1.45, "elapsed_time": "0:27:17", "remaining_time": "1 day, 6:55:18", "throughput": 450.97, "total_tokens": 738624} {"current_steps": 585, "total_steps": 40000, "loss": 0.1639, "lr": 0.29984224229496836, "epoch": 0.028583294652236583, "percentage": 1.46, "elapsed_time": "0:27:20", "remaining_time": "1 day, 6:42:43", "throughput": 454.1, "total_tokens": 745184} {"current_steps": 590, "total_steps": 40000, "loss": 0.1487, "lr": 0.2998395298842998, "epoch": 0.02882759631593091, "percentage": 1.47, "elapsed_time": "0:27:24", "remaining_time": "1 day, 6:30:17", "throughput": 457.13, "total_tokens": 751552} {"current_steps": 595, "total_steps": 40000, "loss": 0.1472, "lr": 0.29983679436649263, "epoch": 0.02907189797962524, "percentage": 1.49, "elapsed_time": "0:27:27", "remaining_time": "1 day, 6:18:00", "throughput": 459.99, "total_tokens": 757632} {"current_steps": 600, "total_steps": 40000, "loss": 0.1286, "lr": 0.2998340357419689, "epoch": 0.029316199643319572, "percentage": 1.5, "elapsed_time": "0:27:30", "remaining_time": "1 day, 6:06:02", "throughput": 463.05, "total_tokens": 764128} {"current_steps": 600, "total_steps": 40000, "eval_loss": 0.15596766769886017, "epoch": 0.029316199643319572, "percentage": 1.5, "elapsed_time": "0:38:08", "remaining_time": "1 day, 17:44:40", "throughput": 333.89, "total_tokens": 764128} {"current_steps": 605, "total_steps": 40000, "loss": 0.1581, "lr": 0.29983125401115385, "epoch": 0.0295605013070139, "percentage": 1.51, "elapsed_time": "0:38:12", "remaining_time": "1 day, 17:27:37", "throughput": 336.04, "total_tokens": 770272} {"current_steps": 610, "total_steps": 40000, "loss": 0.1585, "lr": 0.29982844917447654, "epoch": 0.02980480297070823, "percentage": 1.52, "elapsed_time": "0:38:15", "remaining_time": "1 day, 17:10:19", "throughput": 338.48, "total_tokens": 776928} {"current_steps": 615, "total_steps": 40000, "loss": 0.1483, "lr": 0.2998256212323695, "epoch": 0.030049104634402562, "percentage": 1.54, "elapsed_time": "0:38:18", "remaining_time": "1 day, 16:53:15", "throughput": 340.78, "total_tokens": 783264} {"current_steps": 620, "total_steps": 40000, "loss": 0.1542, "lr": 0.29982277018526887, "epoch": 0.03029340629809689, "percentage": 1.55, "elapsed_time": "0:38:21", "remaining_time": "1 day, 16:36:27", "throughput": 343.15, "total_tokens": 789792} {"current_steps": 625, "total_steps": 40000, "loss": 0.1516, "lr": 0.2998198960336143, "epoch": 0.03053770796179122, "percentage": 1.56, "elapsed_time": "0:38:24", "remaining_time": "1 day, 16:19:55", "throughput": 345.41, "total_tokens": 796064} {"current_steps": 630, "total_steps": 40000, "loss": 0.1295, "lr": 0.299816998777849, "epoch": 0.030782009625485548, "percentage": 1.57, "elapsed_time": "0:38:27", "remaining_time": "1 day, 16:03:35", "throughput": 347.6, "total_tokens": 802176} {"current_steps": 635, "total_steps": 40000, "loss": 0.1159, "lr": 0.2998140784184197, "epoch": 0.03102631128917988, "percentage": 1.59, "elapsed_time": "0:38:30", "remaining_time": "1 day, 15:47:36", "throughput": 349.93, "total_tokens": 808640} {"current_steps": 640, "total_steps": 40000, "loss": 0.1351, "lr": 0.2998111349557769, "epoch": 0.031270612952874206, "percentage": 1.6, "elapsed_time": "0:38:34", "remaining_time": "1 day, 15:31:53", "throughput": 352.17, "total_tokens": 814944} {"current_steps": 645, "total_steps": 40000, "loss": 0.1257, "lr": 0.29980816839037444, "epoch": 0.03151491461656854, "percentage": 1.61, "elapsed_time": "0:38:37", "remaining_time": "1 day, 15:16:27", "throughput": 354.55, "total_tokens": 821568} {"current_steps": 650, "total_steps": 40000, "loss": 0.1278, "lr": 0.2998051787226698, "epoch": 0.03175921628026287, "percentage": 1.62, "elapsed_time": "0:38:40", "remaining_time": "1 day, 15:01:11", "throughput": 356.95, "total_tokens": 828256} {"current_steps": 655, "total_steps": 40000, "loss": 0.1251, "lr": 0.29980216595312403, "epoch": 0.0320035179439572, "percentage": 1.64, "elapsed_time": "0:38:43", "remaining_time": "1 day, 14:46:08", "throughput": 359.19, "total_tokens": 834560} {"current_steps": 660, "total_steps": 40000, "loss": 0.1259, "lr": 0.29979913008220177, "epoch": 0.03224781960765153, "percentage": 1.65, "elapsed_time": "0:38:46", "remaining_time": "1 day, 14:31:15", "throughput": 361.4, "total_tokens": 840800} {"current_steps": 665, "total_steps": 40000, "loss": 0.1381, "lr": 0.2997960711103711, "epoch": 0.03249212127134586, "percentage": 1.66, "elapsed_time": "0:38:49", "remaining_time": "1 day, 14:16:41", "throughput": 363.74, "total_tokens": 847392} {"current_steps": 670, "total_steps": 40000, "loss": 0.1085, "lr": 0.29979298903810386, "epoch": 0.032736422935040185, "percentage": 1.68, "elapsed_time": "0:38:52", "remaining_time": "1 day, 14:02:18", "throughput": 366.01, "total_tokens": 853824} {"current_steps": 675, "total_steps": 40000, "loss": 0.1643, "lr": 0.29978988386587524, "epoch": 0.032980724598734516, "percentage": 1.69, "elapsed_time": "0:38:55", "remaining_time": "1 day, 13:48:05", "throughput": 368.21, "total_tokens": 860096} {"current_steps": 680, "total_steps": 40000, "loss": 0.1435, "lr": 0.2997867555941642, "epoch": 0.03322502626242885, "percentage": 1.7, "elapsed_time": "0:38:58", "remaining_time": "1 day, 13:34:06", "throughput": 370.45, "total_tokens": 866464} {"current_steps": 685, "total_steps": 40000, "loss": 0.145, "lr": 0.299783604223453, "epoch": 0.03346932792612318, "percentage": 1.71, "elapsed_time": "0:39:01", "remaining_time": "1 day, 13:20:13", "throughput": 372.5, "total_tokens": 872384} {"current_steps": 690, "total_steps": 40000, "loss": 0.1327, "lr": 0.29978042975422786, "epoch": 0.03371362958981751, "percentage": 1.73, "elapsed_time": "0:39:05", "remaining_time": "1 day, 13:06:38", "throughput": 374.72, "total_tokens": 878720} {"current_steps": 695, "total_steps": 40000, "loss": 0.1598, "lr": 0.29977723218697816, "epoch": 0.03395793125351183, "percentage": 1.74, "elapsed_time": "0:39:08", "remaining_time": "1 day, 12:53:20", "throughput": 376.92, "total_tokens": 885088} {"current_steps": 700, "total_steps": 40000, "loss": 0.1195, "lr": 0.299774011522197, "epoch": 0.034202232917206164, "percentage": 1.75, "elapsed_time": "0:39:11", "remaining_time": "1 day, 12:40:09", "throughput": 379.17, "total_tokens": 891552} {"current_steps": 705, "total_steps": 40000, "loss": 0.1685, "lr": 0.29977076776038114, "epoch": 0.034446534580900495, "percentage": 1.76, "elapsed_time": "0:39:14", "remaining_time": "1 day, 12:27:04", "throughput": 381.3, "total_tokens": 897696} {"current_steps": 710, "total_steps": 40000, "loss": 0.1469, "lr": 0.2997675009020307, "epoch": 0.034690836244594826, "percentage": 1.77, "elapsed_time": "0:39:17", "remaining_time": "1 day, 12:14:08", "throughput": 383.33, "total_tokens": 903616} {"current_steps": 715, "total_steps": 40000, "loss": 0.1531, "lr": 0.2997642109476496, "epoch": 0.03493513790828916, "percentage": 1.79, "elapsed_time": "0:39:20", "remaining_time": "1 day, 12:01:29", "throughput": 385.55, "total_tokens": 910048} {"current_steps": 720, "total_steps": 40000, "loss": 0.1791, "lr": 0.299760897897745, "epoch": 0.03517943957198349, "percentage": 1.8, "elapsed_time": "0:39:23", "remaining_time": "1 day, 11:48:59", "throughput": 387.71, "total_tokens": 916320} {"current_steps": 725, "total_steps": 40000, "loss": 0.1121, "lr": 0.29975756175282803, "epoch": 0.03542374123567781, "percentage": 1.81, "elapsed_time": "0:39:26", "remaining_time": "1 day, 11:36:35", "throughput": 389.74, "total_tokens": 922304} {"current_steps": 730, "total_steps": 40000, "loss": 0.1414, "lr": 0.29975420251341306, "epoch": 0.03566804289937214, "percentage": 1.82, "elapsed_time": "0:39:29", "remaining_time": "1 day, 11:24:24", "throughput": 391.77, "total_tokens": 928288} {"current_steps": 735, "total_steps": 40000, "loss": 0.1567, "lr": 0.29975082018001814, "epoch": 0.035912344563066474, "percentage": 1.84, "elapsed_time": "0:39:32", "remaining_time": "1 day, 11:12:24", "throughput": 393.82, "total_tokens": 934336} {"current_steps": 740, "total_steps": 40000, "loss": 0.1479, "lr": 0.2997474147531648, "epoch": 0.036156646226760805, "percentage": 1.85, "elapsed_time": "0:39:35", "remaining_time": "1 day, 11:00:34", "throughput": 395.83, "total_tokens": 940320} {"current_steps": 745, "total_steps": 40000, "loss": 0.1496, "lr": 0.29974398623337833, "epoch": 0.036400947890455136, "percentage": 1.86, "elapsed_time": "0:39:38", "remaining_time": "1 day, 10:48:52", "throughput": 397.98, "total_tokens": 946656} {"current_steps": 750, "total_steps": 40000, "loss": 0.1486, "lr": 0.2997405346211873, "epoch": 0.03664524955414947, "percentage": 1.88, "elapsed_time": "0:39:41", "remaining_time": "1 day, 10:37:23", "throughput": 400.17, "total_tokens": 953088} {"current_steps": 755, "total_steps": 40000, "loss": 0.1319, "lr": 0.2997370599171241, "epoch": 0.03688955121784379, "percentage": 1.89, "elapsed_time": "0:39:44", "remaining_time": "1 day, 10:25:58", "throughput": 402.25, "total_tokens": 959264} {"current_steps": 760, "total_steps": 40000, "loss": 0.1277, "lr": 0.2997335621217246, "epoch": 0.03713385288153812, "percentage": 1.9, "elapsed_time": "0:39:47", "remaining_time": "1 day, 10:14:50", "throughput": 404.43, "total_tokens": 965728} {"current_steps": 765, "total_steps": 40000, "loss": 0.1177, "lr": 0.29973004123552816, "epoch": 0.03737815454523245, "percentage": 1.91, "elapsed_time": "0:39:50", "remaining_time": "1 day, 10:03:45", "throughput": 406.54, "total_tokens": 972000} {"current_steps": 770, "total_steps": 40000, "loss": 0.1394, "lr": 0.2997264972590777, "epoch": 0.037622456208926784, "percentage": 1.93, "elapsed_time": "0:39:53", "remaining_time": "1 day, 9:52:49", "throughput": 408.61, "total_tokens": 978208} {"current_steps": 775, "total_steps": 40000, "loss": 0.1097, "lr": 0.29972293019291973, "epoch": 0.037866757872621115, "percentage": 1.94, "elapsed_time": "0:39:57", "remaining_time": "1 day, 9:42:04", "throughput": 410.79, "total_tokens": 984704} {"current_steps": 780, "total_steps": 40000, "loss": 0.148, "lr": 0.2997193400376045, "epoch": 0.03811105953631544, "percentage": 1.95, "elapsed_time": "0:40:00", "remaining_time": "1 day, 9:31:27", "throughput": 412.87, "total_tokens": 990976} {"current_steps": 785, "total_steps": 40000, "loss": 0.1561, "lr": 0.2997157267936854, "epoch": 0.03835536120000977, "percentage": 1.96, "elapsed_time": "0:40:03", "remaining_time": "1 day, 9:20:55", "throughput": 414.92, "total_tokens": 997152} {"current_steps": 790, "total_steps": 40000, "loss": 0.1645, "lr": 0.2997120904617199, "epoch": 0.0385996628637041, "percentage": 1.98, "elapsed_time": "0:40:06", "remaining_time": "1 day, 9:10:37", "throughput": 417.09, "total_tokens": 1003680} {"current_steps": 795, "total_steps": 40000, "loss": 0.1426, "lr": 0.29970843104226863, "epoch": 0.03884396452739843, "percentage": 1.99, "elapsed_time": "0:40:09", "remaining_time": "1 day, 9:00:23", "throughput": 419.13, "total_tokens": 1009888} {"current_steps": 800, "total_steps": 40000, "loss": 0.1539, "lr": 0.2997047485358959, "epoch": 0.03908826619109276, "percentage": 2.0, "elapsed_time": "0:40:12", "remaining_time": "1 day, 8:50:16", "throughput": 421.19, "total_tokens": 1016160} {"current_steps": 800, "total_steps": 40000, "eval_loss": 0.14764031767845154, "epoch": 0.03908826619109276, "percentage": 2.0, "elapsed_time": "0:50:50", "remaining_time": "1 day, 17:31:38", "throughput": 333.06, "total_tokens": 1016160} {"current_steps": 805, "total_steps": 40000, "loss": 0.1695, "lr": 0.2997010429431697, "epoch": 0.039332567854787094, "percentage": 2.01, "elapsed_time": "0:50:54", "remaining_time": "1 day, 17:18:59", "throughput": 334.56, "total_tokens": 1022048} {"current_steps": 810, "total_steps": 40000, "loss": 0.1557, "lr": 0.29969731426466134, "epoch": 0.03957686951848142, "percentage": 2.02, "elapsed_time": "0:50:57", "remaining_time": "1 day, 17:05:52", "throughput": 336.35, "total_tokens": 1028544} {"current_steps": 815, "total_steps": 40000, "loss": 0.1246, "lr": 0.299693562500946, "epoch": 0.03982117118217575, "percentage": 2.04, "elapsed_time": "0:51:01", "remaining_time": "1 day, 16:52:54", "throughput": 338.12, "total_tokens": 1035008} {"current_steps": 820, "total_steps": 40000, "loss": 0.1188, "lr": 0.29968978765260207, "epoch": 0.04006547284587008, "percentage": 2.05, "elapsed_time": "0:51:04", "remaining_time": "1 day, 16:40:02", "throughput": 339.83, "total_tokens": 1041248} {"current_steps": 825, "total_steps": 40000, "loss": 0.1541, "lr": 0.2996859897202118, "epoch": 0.04030977450956441, "percentage": 2.06, "elapsed_time": "0:51:07", "remaining_time": "1 day, 16:27:23", "throughput": 341.64, "total_tokens": 1047872} {"current_steps": 830, "total_steps": 40000, "loss": 0.1175, "lr": 0.2996821687043609, "epoch": 0.04055407617325874, "percentage": 2.08, "elapsed_time": "0:51:10", "remaining_time": "1 day, 16:14:57", "throughput": 343.47, "total_tokens": 1054560} {"current_steps": 835, "total_steps": 40000, "loss": 0.1107, "lr": 0.2996783246056384, "epoch": 0.04079837783695307, "percentage": 2.09, "elapsed_time": "0:51:13", "remaining_time": "1 day, 16:02:36", "throughput": 345.19, "total_tokens": 1060928} {"current_steps": 840, "total_steps": 40000, "loss": 0.1586, "lr": 0.29967445742463744, "epoch": 0.0410426795006474, "percentage": 2.1, "elapsed_time": "0:51:16", "remaining_time": "1 day, 15:50:22", "throughput": 346.88, "total_tokens": 1067168} {"current_steps": 845, "total_steps": 40000, "loss": 0.1234, "lr": 0.29967056716195417, "epoch": 0.04128698116434173, "percentage": 2.11, "elapsed_time": "0:51:19", "remaining_time": "1 day, 15:38:17", "throughput": 348.64, "total_tokens": 1073664} {"current_steps": 850, "total_steps": 40000, "loss": 0.1839, "lr": 0.2996666538181885, "epoch": 0.04153128282803606, "percentage": 2.12, "elapsed_time": "0:51:22", "remaining_time": "1 day, 15:26:20", "throughput": 350.3, "total_tokens": 1079840} {"current_steps": 855, "total_steps": 40000, "loss": 0.1688, "lr": 0.29966271739394407, "epoch": 0.04177558449173039, "percentage": 2.14, "elapsed_time": "0:51:25", "remaining_time": "1 day, 15:14:32", "throughput": 351.9, "total_tokens": 1085856} {"current_steps": 860, "total_steps": 40000, "loss": 0.1511, "lr": 0.29965875788982776, "epoch": 0.04201988615542472, "percentage": 2.15, "elapsed_time": "0:51:28", "remaining_time": "1 day, 15:02:53", "throughput": 353.56, "total_tokens": 1092064} {"current_steps": 865, "total_steps": 40000, "loss": 0.1497, "lr": 0.2996547753064503, "epoch": 0.042264187819119045, "percentage": 2.16, "elapsed_time": "0:51:31", "remaining_time": "1 day, 14:51:18", "throughput": 355.11, "total_tokens": 1097920} {"current_steps": 870, "total_steps": 40000, "loss": 0.1179, "lr": 0.29965076964442583, "epoch": 0.042508489482813376, "percentage": 2.17, "elapsed_time": "0:51:34", "remaining_time": "1 day, 14:39:56", "throughput": 356.79, "total_tokens": 1104192} {"current_steps": 875, "total_steps": 40000, "loss": 0.1382, "lr": 0.299646740904372, "epoch": 0.04275279114650771, "percentage": 2.19, "elapsed_time": "0:51:37", "remaining_time": "1 day, 14:28:40", "throughput": 358.44, "total_tokens": 1110400} {"current_steps": 880, "total_steps": 40000, "loss": 0.1165, "lr": 0.29964268908691016, "epoch": 0.04299709281020204, "percentage": 2.2, "elapsed_time": "0:51:41", "remaining_time": "1 day, 14:17:33", "throughput": 360.12, "total_tokens": 1116736} {"current_steps": 885, "total_steps": 40000, "loss": 0.1684, "lr": 0.29963861419266513, "epoch": 0.04324139447389637, "percentage": 2.21, "elapsed_time": "0:51:44", "remaining_time": "1 day, 14:06:30", "throughput": 361.73, "total_tokens": 1122816} {"current_steps": 890, "total_steps": 40000, "loss": 0.1176, "lr": 0.29963451622226533, "epoch": 0.0434856961375907, "percentage": 2.23, "elapsed_time": "0:51:47", "remaining_time": "1 day, 13:55:43", "throughput": 363.56, "total_tokens": 1129664} {"current_steps": 895, "total_steps": 40000, "loss": 0.1254, "lr": 0.29963039517634277, "epoch": 0.043729997801285024, "percentage": 2.24, "elapsed_time": "0:51:50", "remaining_time": "1 day, 13:44:57", "throughput": 365.21, "total_tokens": 1135904} {"current_steps": 900, "total_steps": 40000, "loss": 0.1614, "lr": 0.2996262510555328, "epoch": 0.043974299464979355, "percentage": 2.25, "elapsed_time": "0:51:53", "remaining_time": "1 day, 13:34:22", "throughput": 366.96, "total_tokens": 1142528} {"current_steps": 905, "total_steps": 40000, "loss": 0.1515, "lr": 0.2996220838604746, "epoch": 0.044218601128673686, "percentage": 2.26, "elapsed_time": "0:51:56", "remaining_time": "1 day, 13:23:49", "throughput": 368.57, "total_tokens": 1148640} {"current_steps": 910, "total_steps": 40000, "loss": 0.163, "lr": 0.29961789359181085, "epoch": 0.04446290279236802, "percentage": 2.27, "elapsed_time": "0:51:59", "remaining_time": "1 day, 13:13:22", "throughput": 370.15, "total_tokens": 1154688} {"current_steps": 915, "total_steps": 40000, "loss": 0.151, "lr": 0.29961368025018764, "epoch": 0.04470720445606235, "percentage": 2.29, "elapsed_time": "0:52:02", "remaining_time": "1 day, 13:03:06", "throughput": 371.82, "total_tokens": 1161056} {"current_steps": 920, "total_steps": 40000, "loss": 0.1506, "lr": 0.2996094438362548, "epoch": 0.04495150611975668, "percentage": 2.3, "elapsed_time": "0:52:05", "remaining_time": "1 day, 12:52:56", "throughput": 373.48, "total_tokens": 1167392} {"current_steps": 925, "total_steps": 40000, "loss": 0.1206, "lr": 0.2996051843506657, "epoch": 0.045195807783451, "percentage": 2.31, "elapsed_time": "0:52:08", "remaining_time": "1 day, 12:42:56", "throughput": 375.23, "total_tokens": 1174080} {"current_steps": 930, "total_steps": 40000, "loss": 0.1403, "lr": 0.299600901794077, "epoch": 0.045440109447145334, "percentage": 2.33, "elapsed_time": "0:52:11", "remaining_time": "1 day, 12:32:55", "throughput": 376.77, "total_tokens": 1180032} {"current_steps": 935, "total_steps": 40000, "loss": 0.1016, "lr": 0.29959659616714923, "epoch": 0.045684411110839665, "percentage": 2.34, "elapsed_time": "0:52:15", "remaining_time": "1 day, 12:23:03", "throughput": 378.43, "total_tokens": 1186368} {"current_steps": 940, "total_steps": 40000, "loss": 0.1497, "lr": 0.2995922674705464, "epoch": 0.045928712774533996, "percentage": 2.35, "elapsed_time": "0:52:18", "remaining_time": "1 day, 12:13:16", "throughput": 380.01, "total_tokens": 1192480} {"current_steps": 945, "total_steps": 40000, "loss": 0.1184, "lr": 0.2995879157049361, "epoch": 0.04617301443822833, "percentage": 2.36, "elapsed_time": "0:52:21", "remaining_time": "1 day, 12:03:34", "throughput": 381.68, "total_tokens": 1198880} {"current_steps": 950, "total_steps": 40000, "loss": 0.134, "lr": 0.2995835408709893, "epoch": 0.04641731610192265, "percentage": 2.38, "elapsed_time": "0:52:24", "remaining_time": "1 day, 11:53:58", "throughput": 383.19, "total_tokens": 1204768} {"current_steps": 955, "total_steps": 40000, "loss": 0.1561, "lr": 0.29957914296938076, "epoch": 0.04666161776561698, "percentage": 2.39, "elapsed_time": "0:52:27", "remaining_time": "1 day, 11:44:33", "throughput": 384.85, "total_tokens": 1211200} {"current_steps": 960, "total_steps": 40000, "loss": 0.1557, "lr": 0.2995747220007886, "epoch": 0.04690591942931131, "percentage": 2.4, "elapsed_time": "0:52:30", "remaining_time": "1 day, 11:35:12", "throughput": 386.5, "total_tokens": 1217600} {"current_steps": 965, "total_steps": 40000, "loss": 0.1172, "lr": 0.2995702779658947, "epoch": 0.047150221093005644, "percentage": 2.41, "elapsed_time": "0:52:33", "remaining_time": "1 day, 11:25:58", "throughput": 388.13, "total_tokens": 1223936} {"current_steps": 970, "total_steps": 40000, "loss": 0.0967, "lr": 0.29956581086538425, "epoch": 0.047394522756699975, "percentage": 2.43, "elapsed_time": "0:52:36", "remaining_time": "1 day, 11:16:50", "throughput": 389.82, "total_tokens": 1230496} {"current_steps": 975, "total_steps": 40000, "loss": 0.1123, "lr": 0.2995613206999462, "epoch": 0.047638824420394306, "percentage": 2.44, "elapsed_time": "0:52:39", "remaining_time": "1 day, 11:07:46", "throughput": 391.52, "total_tokens": 1237056} {"current_steps": 980, "total_steps": 40000, "loss": 0.0948, "lr": 0.29955680747027297, "epoch": 0.04788312608408863, "percentage": 2.45, "elapsed_time": "0:52:42", "remaining_time": "1 day, 10:58:51", "throughput": 393.25, "total_tokens": 1243776} {"current_steps": 985, "total_steps": 40000, "loss": 0.1648, "lr": 0.2995522711770607, "epoch": 0.04812742774778296, "percentage": 2.46, "elapsed_time": "0:52:45", "remaining_time": "1 day, 10:49:57", "throughput": 394.8, "total_tokens": 1249888} {"current_steps": 990, "total_steps": 40000, "loss": 0.1001, "lr": 0.2995477118210087, "epoch": 0.04837172941147729, "percentage": 2.48, "elapsed_time": "0:52:48", "remaining_time": "1 day, 10:41:10", "throughput": 396.41, "total_tokens": 1256224} {"current_steps": 995, "total_steps": 40000, "loss": 0.1699, "lr": 0.29954312940282024, "epoch": 0.04861603107517162, "percentage": 2.49, "elapsed_time": "0:52:51", "remaining_time": "1 day, 10:32:22", "throughput": 397.85, "total_tokens": 1261952} {"current_steps": 1000, "total_steps": 40000, "loss": 0.1205, "lr": 0.29953852392320196, "epoch": 0.048860332738865954, "percentage": 2.5, "elapsed_time": "0:52:55", "remaining_time": "1 day, 10:23:47", "throughput": 399.48, "total_tokens": 1268384} {"current_steps": 1000, "total_steps": 40000, "eval_loss": 0.13077235221862793, "epoch": 0.048860332738865954, "percentage": 2.5, "elapsed_time": "1:03:33", "remaining_time": "1 day, 17:18:42", "throughput": 332.61, "total_tokens": 1268384} {"current_steps": 1005, "total_steps": 40000, "loss": 0.127, "lr": 0.2995338953828641, "epoch": 0.049104634402560285, "percentage": 2.51, "elapsed_time": "1:03:37", "remaining_time": "1 day, 17:08:24", "throughput": 333.96, "total_tokens": 1274752} {"current_steps": 1010, "total_steps": 40000, "loss": 0.1263, "lr": 0.2995292437825204, "epoch": 0.04934893606625461, "percentage": 2.53, "elapsed_time": "1:03:40", "remaining_time": "1 day, 16:57:50", "throughput": 335.35, "total_tokens": 1281056} {"current_steps": 1015, "total_steps": 40000, "loss": 0.147, "lr": 0.29952456912288816, "epoch": 0.04959323772994894, "percentage": 2.54, "elapsed_time": "1:03:43", "remaining_time": "1 day, 16:47:21", "throughput": 336.73, "total_tokens": 1287360} {"current_steps": 1020, "total_steps": 40000, "loss": 0.1525, "lr": 0.2995198714046884, "epoch": 0.04983753939364327, "percentage": 2.55, "elapsed_time": "1:03:46", "remaining_time": "1 day, 16:37:04", "throughput": 338.2, "total_tokens": 1294048} {"current_steps": 1025, "total_steps": 40000, "loss": 0.1132, "lr": 0.2995151506286454, "epoch": 0.0500818410573376, "percentage": 2.56, "elapsed_time": "1:03:49", "remaining_time": "1 day, 16:26:52", "throughput": 339.63, "total_tokens": 1300608} {"current_steps": 1030, "total_steps": 40000, "loss": 0.1382, "lr": 0.2995104067954873, "epoch": 0.05032614272103193, "percentage": 2.57, "elapsed_time": "1:03:52", "remaining_time": "1 day, 16:16:44", "throughput": 341.02, "total_tokens": 1306976} {"current_steps": 1035, "total_steps": 40000, "loss": 0.1318, "lr": 0.2995056399059456, "epoch": 0.05057044438472626, "percentage": 2.59, "elapsed_time": "1:03:55", "remaining_time": "1 day, 16:06:33", "throughput": 342.24, "total_tokens": 1312640} {"current_steps": 1040, "total_steps": 40000, "loss": 0.1371, "lr": 0.2995008499607554, "epoch": 0.05081474604842059, "percentage": 2.6, "elapsed_time": "1:03:58", "remaining_time": "1 day, 15:56:36", "throughput": 343.62, "total_tokens": 1318976} {"current_steps": 1045, "total_steps": 40000, "loss": 0.1643, "lr": 0.2994960369606554, "epoch": 0.05105904771211492, "percentage": 2.61, "elapsed_time": "1:04:01", "remaining_time": "1 day, 15:46:42", "throughput": 344.93, "total_tokens": 1325056} {"current_steps": 1050, "total_steps": 40000, "loss": 0.137, "lr": 0.2994912009063878, "epoch": 0.05130334937580925, "percentage": 2.62, "elapsed_time": "1:04:04", "remaining_time": "1 day, 15:36:57", "throughput": 346.31, "total_tokens": 1331456} {"current_steps": 1055, "total_steps": 40000, "loss": 0.153, "lr": 0.29948634179869843, "epoch": 0.05154765103950358, "percentage": 2.64, "elapsed_time": "1:04:07", "remaining_time": "1 day, 15:27:14", "throughput": 347.57, "total_tokens": 1337344} {"current_steps": 1060, "total_steps": 40000, "loss": 0.1301, "lr": 0.29948145963833656, "epoch": 0.05179195270319791, "percentage": 2.65, "elapsed_time": "1:04:10", "remaining_time": "1 day, 15:17:36", "throughput": 348.87, "total_tokens": 1343360} {"current_steps": 1065, "total_steps": 40000, "loss": 0.1375, "lr": 0.29947655442605514, "epoch": 0.052036254366892236, "percentage": 2.66, "elapsed_time": "1:04:13", "remaining_time": "1 day, 15:08:10", "throughput": 350.36, "total_tokens": 1350208} {"current_steps": 1070, "total_steps": 40000, "loss": 0.1091, "lr": 0.2994716261626106, "epoch": 0.05228055603058657, "percentage": 2.67, "elapsed_time": "1:04:16", "remaining_time": "1 day, 14:58:49", "throughput": 351.73, "total_tokens": 1356608} {"current_steps": 1075, "total_steps": 40000, "loss": 0.1991, "lr": 0.2994666748487629, "epoch": 0.0525248576942809, "percentage": 2.69, "elapsed_time": "1:04:20", "remaining_time": "1 day, 14:49:33", "throughput": 353.11, "total_tokens": 1363040} {"current_steps": 1080, "total_steps": 40000, "loss": 0.1267, "lr": 0.2994617004852756, "epoch": 0.05276915935797523, "percentage": 2.7, "elapsed_time": "1:04:23", "remaining_time": "1 day, 14:40:16", "throughput": 354.43, "total_tokens": 1369216} {"current_steps": 1085, "total_steps": 40000, "loss": 0.1254, "lr": 0.2994567030729159, "epoch": 0.05301346102166956, "percentage": 2.71, "elapsed_time": "1:04:26", "remaining_time": "1 day, 14:31:06", "throughput": 355.76, "total_tokens": 1375424} {"current_steps": 1090, "total_steps": 40000, "loss": 0.1455, "lr": 0.29945168261245436, "epoch": 0.053257762685363884, "percentage": 2.73, "elapsed_time": "1:04:29", "remaining_time": "1 day, 14:22:01", "throughput": 357.07, "total_tokens": 1381600} {"current_steps": 1095, "total_steps": 40000, "loss": 0.1394, "lr": 0.29944663910466524, "epoch": 0.053502064349058215, "percentage": 2.74, "elapsed_time": "1:04:32", "remaining_time": "1 day, 14:13:01", "throughput": 358.35, "total_tokens": 1387648} {"current_steps": 1100, "total_steps": 40000, "loss": 0.1177, "lr": 0.2994415725503263, "epoch": 0.053746366012752546, "percentage": 2.75, "elapsed_time": "1:04:35", "remaining_time": "1 day, 14:04:06", "throughput": 359.66, "total_tokens": 1393824} {"current_steps": 1105, "total_steps": 40000, "loss": 0.138, "lr": 0.29943648295021885, "epoch": 0.05399066767644688, "percentage": 2.76, "elapsed_time": "1:04:38", "remaining_time": "1 day, 13:55:16", "throughput": 360.96, "total_tokens": 1399936} {"current_steps": 1110, "total_steps": 40000, "loss": 0.139, "lr": 0.2994313703051278, "epoch": 0.05423496934014121, "percentage": 2.77, "elapsed_time": "1:04:41", "remaining_time": "1 day, 13:46:29", "throughput": 362.31, "total_tokens": 1406272} {"current_steps": 1115, "total_steps": 40000, "loss": 0.1479, "lr": 0.29942623461584156, "epoch": 0.05447927100383554, "percentage": 2.79, "elapsed_time": "1:04:44", "remaining_time": "1 day, 13:37:52", "throughput": 363.7, "total_tokens": 1412800} {"current_steps": 1120, "total_steps": 40000, "loss": 0.1104, "lr": 0.29942107588315214, "epoch": 0.05472357266752986, "percentage": 2.8, "elapsed_time": "1:04:47", "remaining_time": "1 day, 13:29:16", "throughput": 365.02, "total_tokens": 1419072} {"current_steps": 1125, "total_steps": 40000, "loss": 0.1447, "lr": 0.29941589410785513, "epoch": 0.054967874331224194, "percentage": 2.81, "elapsed_time": "1:04:50", "remaining_time": "1 day, 13:20:43", "throughput": 366.21, "total_tokens": 1424800} {"current_steps": 1130, "total_steps": 40000, "loss": 0.1317, "lr": 0.29941068929074954, "epoch": 0.055212175994918525, "percentage": 2.83, "elapsed_time": "1:04:53", "remaining_time": "1 day, 13:12:16", "throughput": 367.57, "total_tokens": 1431200} {"current_steps": 1135, "total_steps": 40000, "loss": 0.1388, "lr": 0.2994054614326381, "epoch": 0.055456477658612856, "percentage": 2.84, "elapsed_time": "1:04:56", "remaining_time": "1 day, 13:03:53", "throughput": 368.88, "total_tokens": 1437440} {"current_steps": 1140, "total_steps": 40000, "loss": 0.1453, "lr": 0.29940021053432686, "epoch": 0.05570077932230719, "percentage": 2.85, "elapsed_time": "1:04:59", "remaining_time": "1 day, 12:55:34", "throughput": 370.16, "total_tokens": 1443552} {"current_steps": 1145, "total_steps": 40000, "loss": 0.1276, "lr": 0.29939493659662575, "epoch": 0.05594508098600152, "percentage": 2.86, "elapsed_time": "1:05:02", "remaining_time": "1 day, 12:47:22", "throughput": 371.57, "total_tokens": 1450176} {"current_steps": 1150, "total_steps": 40000, "loss": 0.1242, "lr": 0.299389639620348, "epoch": 0.05618938264969584, "percentage": 2.88, "elapsed_time": "1:05:05", "remaining_time": "1 day, 12:39:13", "throughput": 372.93, "total_tokens": 1456672} {"current_steps": 1155, "total_steps": 40000, "loss": 0.1102, "lr": 0.29938431960631046, "epoch": 0.05643368431339017, "percentage": 2.89, "elapsed_time": "1:05:09", "remaining_time": "1 day, 12:31:07", "throughput": 374.17, "total_tokens": 1462624} {"current_steps": 1160, "total_steps": 40000, "loss": 0.1329, "lr": 0.2993789765553335, "epoch": 0.056677985977084504, "percentage": 2.9, "elapsed_time": "1:05:12", "remaining_time": "1 day, 12:23:10", "throughput": 375.59, "total_tokens": 1469376} {"current_steps": 1165, "total_steps": 40000, "loss": 0.0931, "lr": 0.2993736104682412, "epoch": 0.056922287640778835, "percentage": 2.91, "elapsed_time": "1:05:15", "remaining_time": "1 day, 12:15:19", "throughput": 377.09, "total_tokens": 1476448} {"current_steps": 1170, "total_steps": 40000, "loss": 0.1539, "lr": 0.299368221345861, "epoch": 0.057166589304473166, "percentage": 2.93, "elapsed_time": "1:05:18", "remaining_time": "1 day, 12:07:26", "throughput": 378.38, "total_tokens": 1482688} {"current_steps": 1175, "total_steps": 40000, "loss": 0.1558, "lr": 0.29936280918902397, "epoch": 0.05741089096816749, "percentage": 2.94, "elapsed_time": "1:05:21", "remaining_time": "1 day, 11:59:35", "throughput": 379.61, "total_tokens": 1488640} {"current_steps": 1180, "total_steps": 40000, "loss": 0.1415, "lr": 0.2993573739985648, "epoch": 0.05765519263186182, "percentage": 2.95, "elapsed_time": "1:05:24", "remaining_time": "1 day, 11:51:46", "throughput": 380.84, "total_tokens": 1494560} {"current_steps": 1185, "total_steps": 40000, "loss": 0.1294, "lr": 0.2993519157753216, "epoch": 0.05789949429555615, "percentage": 2.96, "elapsed_time": "1:05:27", "remaining_time": "1 day, 11:44:08", "throughput": 382.22, "total_tokens": 1501184} {"current_steps": 1190, "total_steps": 40000, "loss": 0.138, "lr": 0.2993464345201361, "epoch": 0.05814379595925048, "percentage": 2.97, "elapsed_time": "1:05:30", "remaining_time": "1 day, 11:36:34", "throughput": 383.59, "total_tokens": 1507808} {"current_steps": 1195, "total_steps": 40000, "loss": 0.1368, "lr": 0.2993409302338536, "epoch": 0.058388097622944814, "percentage": 2.99, "elapsed_time": "1:05:33", "remaining_time": "1 day, 11:28:58", "throughput": 384.82, "total_tokens": 1513760} {"current_steps": 1200, "total_steps": 40000, "loss": 0.1145, "lr": 0.2993354029173229, "epoch": 0.058632399286639145, "percentage": 3.0, "elapsed_time": "1:05:36", "remaining_time": "1 day, 11:21:30", "throughput": 386.2, "total_tokens": 1520384} {"current_steps": 1200, "total_steps": 40000, "eval_loss": 0.1469876915216446, "epoch": 0.058632399286639145, "percentage": 3.0, "elapsed_time": "1:16:15", "remaining_time": "1 day, 17:05:32", "throughput": 332.31, "total_tokens": 1520384} {"current_steps": 1205, "total_steps": 40000, "loss": 0.1373, "lr": 0.2993298525713965, "epoch": 0.05887670095033347, "percentage": 3.01, "elapsed_time": "1:16:18", "remaining_time": "1 day, 16:57:00", "throughput": 333.44, "total_tokens": 1526816} {"current_steps": 1210, "total_steps": 40000, "loss": 0.1281, "lr": 0.29932427919693017, "epoch": 0.0591210026140278, "percentage": 3.02, "elapsed_time": "1:16:22", "remaining_time": "1 day, 16:48:13", "throughput": 334.63, "total_tokens": 1533312} {"current_steps": 1215, "total_steps": 40000, "loss": 0.1478, "lr": 0.2993186827947834, "epoch": 0.05936530427772213, "percentage": 3.04, "elapsed_time": "1:16:25", "remaining_time": "1 day, 16:39:24", "throughput": 335.72, "total_tokens": 1539296} {"current_steps": 1220, "total_steps": 40000, "loss": 0.1264, "lr": 0.2993130633658194, "epoch": 0.05960960594141646, "percentage": 3.05, "elapsed_time": "1:16:28", "remaining_time": "1 day, 16:30:44", "throughput": 336.91, "total_tokens": 1545792} {"current_steps": 1225, "total_steps": 40000, "loss": 0.1049, "lr": 0.29930742091090456, "epoch": 0.05985390760511079, "percentage": 3.06, "elapsed_time": "1:16:31", "remaining_time": "1 day, 16:22:06", "throughput": 338.04, "total_tokens": 1552032} {"current_steps": 1230, "total_steps": 40000, "loss": 0.1296, "lr": 0.29930175543090914, "epoch": 0.060098209268805124, "percentage": 3.08, "elapsed_time": "1:16:34", "remaining_time": "1 day, 16:13:33", "throughput": 339.2, "total_tokens": 1558400} {"current_steps": 1235, "total_steps": 40000, "loss": 0.1101, "lr": 0.2992960669267068, "epoch": 0.06034251093249945, "percentage": 3.09, "elapsed_time": "1:16:37", "remaining_time": "1 day, 16:05:03", "throughput": 340.31, "total_tokens": 1564512} {"current_steps": 1240, "total_steps": 40000, "loss": 0.1566, "lr": 0.29929035539917476, "epoch": 0.06058681259619378, "percentage": 3.1, "elapsed_time": "1:16:40", "remaining_time": "1 day, 15:56:39", "throughput": 341.47, "total_tokens": 1570880} {"current_steps": 1245, "total_steps": 40000, "loss": 0.1104, "lr": 0.2992846208491938, "epoch": 0.06083111425988811, "percentage": 3.11, "elapsed_time": "1:16:43", "remaining_time": "1 day, 15:48:19", "throughput": 342.62, "total_tokens": 1577248} {"current_steps": 1250, "total_steps": 40000, "loss": 0.1129, "lr": 0.2992788632776483, "epoch": 0.06107541592358244, "percentage": 3.12, "elapsed_time": "1:16:46", "remaining_time": "1 day, 15:40:02", "throughput": 343.76, "total_tokens": 1583520} {"current_steps": 1255, "total_steps": 40000, "loss": 0.18, "lr": 0.29927308268542613, "epoch": 0.06131971758727677, "percentage": 3.14, "elapsed_time": "1:16:49", "remaining_time": "1 day, 15:31:47", "throughput": 344.82, "total_tokens": 1589472} {"current_steps": 1260, "total_steps": 40000, "loss": 0.1479, "lr": 0.2992672790734187, "epoch": 0.061564019250971096, "percentage": 3.15, "elapsed_time": "1:16:52", "remaining_time": "1 day, 15:23:38", "throughput": 345.91, "total_tokens": 1595552} {"current_steps": 1265, "total_steps": 40000, "loss": 0.1402, "lr": 0.299261452442521, "epoch": 0.06180832091466543, "percentage": 3.16, "elapsed_time": "1:16:55", "remaining_time": "1 day, 15:15:34", "throughput": 347.04, "total_tokens": 1601824} {"current_steps": 1270, "total_steps": 40000, "loss": 0.1415, "lr": 0.29925560279363167, "epoch": 0.06205262257835976, "percentage": 3.17, "elapsed_time": "1:16:58", "remaining_time": "1 day, 15:07:32", "throughput": 348.13, "total_tokens": 1607904} {"current_steps": 1275, "total_steps": 40000, "loss": 0.1444, "lr": 0.29924973012765266, "epoch": 0.06229692424205409, "percentage": 3.19, "elapsed_time": "1:17:01", "remaining_time": "1 day, 14:59:36", "throughput": 349.25, "total_tokens": 1614176} {"current_steps": 1280, "total_steps": 40000, "loss": 0.1045, "lr": 0.29924383444548974, "epoch": 0.06254122590574841, "percentage": 3.2, "elapsed_time": "1:17:04", "remaining_time": "1 day, 14:51:42", "throughput": 350.36, "total_tokens": 1620352} {"current_steps": 1285, "total_steps": 40000, "loss": 0.1009, "lr": 0.299237915748052, "epoch": 0.06278552756944275, "percentage": 3.21, "elapsed_time": "1:17:07", "remaining_time": "1 day, 14:43:50", "throughput": 351.43, "total_tokens": 1626400} {"current_steps": 1290, "total_steps": 40000, "loss": 0.1044, "lr": 0.2992319740362522, "epoch": 0.06302982923313707, "percentage": 3.23, "elapsed_time": "1:17:11", "remaining_time": "1 day, 14:36:05", "throughput": 352.61, "total_tokens": 1632928} {"current_steps": 1295, "total_steps": 40000, "loss": 0.1105, "lr": 0.2992260093110066, "epoch": 0.06327413089683141, "percentage": 3.24, "elapsed_time": "1:17:14", "remaining_time": "1 day, 14:28:27", "throughput": 353.82, "total_tokens": 1639680} {"current_steps": 1300, "total_steps": 40000, "loss": 0.1381, "lr": 0.2992200215732352, "epoch": 0.06351843256052574, "percentage": 3.25, "elapsed_time": "1:17:17", "remaining_time": "1 day, 14:20:45", "throughput": 354.88, "total_tokens": 1645632} {"current_steps": 1305, "total_steps": 40000, "loss": 0.141, "lr": 0.2992140108238611, "epoch": 0.06376273422422006, "percentage": 3.26, "elapsed_time": "1:17:20", "remaining_time": "1 day, 14:13:09", "throughput": 356.0, "total_tokens": 1651936} {"current_steps": 1310, "total_steps": 40000, "loss": 0.1466, "lr": 0.2992079770638115, "epoch": 0.0640070358879144, "percentage": 3.28, "elapsed_time": "1:17:23", "remaining_time": "1 day, 14:05:39", "throughput": 357.18, "total_tokens": 1658528} {"current_steps": 1315, "total_steps": 40000, "loss": 0.1285, "lr": 0.29920192029401677, "epoch": 0.06425133755160872, "percentage": 3.29, "elapsed_time": "1:17:26", "remaining_time": "1 day, 13:58:09", "throughput": 358.26, "total_tokens": 1664640} {"current_steps": 1320, "total_steps": 40000, "loss": 0.1122, "lr": 0.2991958405154109, "epoch": 0.06449563921530306, "percentage": 3.3, "elapsed_time": "1:17:29", "remaining_time": "1 day, 13:50:45", "throughput": 359.43, "total_tokens": 1671200} {"current_steps": 1325, "total_steps": 40000, "loss": 0.1233, "lr": 0.29918973772893154, "epoch": 0.06473994087899738, "percentage": 3.31, "elapsed_time": "1:17:32", "remaining_time": "1 day, 13:43:25", "throughput": 360.62, "total_tokens": 1677824} {"current_steps": 1330, "total_steps": 40000, "loss": 0.0954, "lr": 0.29918361193551973, "epoch": 0.06498424254269172, "percentage": 3.33, "elapsed_time": "1:17:35", "remaining_time": "1 day, 13:36:05", "throughput": 361.75, "total_tokens": 1684224} {"current_steps": 1335, "total_steps": 40000, "loss": 0.1136, "lr": 0.29917746313612026, "epoch": 0.06522854420638605, "percentage": 3.34, "elapsed_time": "1:17:38", "remaining_time": "1 day, 13:28:50", "throughput": 362.88, "total_tokens": 1690592} {"current_steps": 1340, "total_steps": 40000, "loss": 0.0938, "lr": 0.29917129133168124, "epoch": 0.06547284587008037, "percentage": 3.35, "elapsed_time": "1:17:41", "remaining_time": "1 day, 13:21:39", "throughput": 364.01, "total_tokens": 1696992} {"current_steps": 1345, "total_steps": 40000, "loss": 0.1013, "lr": 0.2991650965231546, "epoch": 0.06571714753377471, "percentage": 3.36, "elapsed_time": "1:17:45", "remaining_time": "1 day, 13:14:32", "throughput": 365.17, "total_tokens": 1703552} {"current_steps": 1350, "total_steps": 40000, "loss": 0.1041, "lr": 0.29915887871149544, "epoch": 0.06596144919746903, "percentage": 3.38, "elapsed_time": "1:17:48", "remaining_time": "1 day, 13:07:28", "throughput": 366.29, "total_tokens": 1709920} {"current_steps": 1355, "total_steps": 40000, "loss": 0.13, "lr": 0.2991526378976628, "epoch": 0.06620575086116337, "percentage": 3.39, "elapsed_time": "1:17:51", "remaining_time": "1 day, 13:00:24", "throughput": 367.32, "total_tokens": 1715840} {"current_steps": 1360, "total_steps": 40000, "loss": 0.1458, "lr": 0.29914637408261896, "epoch": 0.0664500525248577, "percentage": 3.4, "elapsed_time": "1:17:54", "remaining_time": "1 day, 12:53:22", "throughput": 368.36, "total_tokens": 1721792} {"current_steps": 1365, "total_steps": 40000, "loss": 0.1373, "lr": 0.29914008726733, "epoch": 0.06669435418855202, "percentage": 3.41, "elapsed_time": "1:17:57", "remaining_time": "1 day, 12:46:24", "throughput": 369.43, "total_tokens": 1727904} {"current_steps": 1370, "total_steps": 40000, "loss": 0.1309, "lr": 0.2991337774527653, "epoch": 0.06693865585224636, "percentage": 3.43, "elapsed_time": "1:18:00", "remaining_time": "1 day, 12:39:36", "throughput": 370.7, "total_tokens": 1735072} {"current_steps": 1375, "total_steps": 40000, "loss": 0.113, "lr": 0.2991274446398981, "epoch": 0.06718295751594068, "percentage": 3.44, "elapsed_time": "1:18:03", "remaining_time": "1 day, 12:32:45", "throughput": 371.83, "total_tokens": 1741504} {"current_steps": 1380, "total_steps": 40000, "loss": 0.1465, "lr": 0.29912108882970484, "epoch": 0.06742725917963502, "percentage": 3.45, "elapsed_time": "1:18:06", "remaining_time": "1 day, 12:25:59", "throughput": 373.02, "total_tokens": 1748224} {"current_steps": 1385, "total_steps": 40000, "loss": 0.1165, "lr": 0.2991147100231657, "epoch": 0.06767156084332934, "percentage": 3.46, "elapsed_time": "1:18:09", "remaining_time": "1 day, 12:19:16", "throughput": 374.19, "total_tokens": 1754880} {"current_steps": 1390, "total_steps": 40000, "loss": 0.1448, "lr": 0.2991083082212644, "epoch": 0.06791586250702367, "percentage": 3.48, "elapsed_time": "1:18:12", "remaining_time": "1 day, 12:12:32", "throughput": 375.2, "total_tokens": 1760768} {"current_steps": 1395, "total_steps": 40000, "loss": 0.1255, "lr": 0.2991018834249881, "epoch": 0.068160164170718, "percentage": 3.49, "elapsed_time": "1:18:15", "remaining_time": "1 day, 12:05:54", "throughput": 376.33, "total_tokens": 1767200} {"current_steps": 1400, "total_steps": 40000, "loss": 0.1343, "lr": 0.29909543563532764, "epoch": 0.06840446583441233, "percentage": 3.5, "elapsed_time": "1:18:18", "remaining_time": "1 day, 11:59:17", "throughput": 377.4, "total_tokens": 1773408} {"current_steps": 1400, "total_steps": 40000, "eval_loss": 0.12485729157924652, "epoch": 0.06840446583441233, "percentage": 3.5, "elapsed_time": "1:28:57", "remaining_time": "1 day, 16:52:41", "throughput": 332.26, "total_tokens": 1773408} {"current_steps": 1405, "total_steps": 40000, "loss": 0.1415, "lr": 0.29908896485327746, "epoch": 0.06864876749810667, "percentage": 3.51, "elapsed_time": "1:29:01", "remaining_time": "1 day, 16:45:23", "throughput": 333.25, "total_tokens": 1780000} {"current_steps": 1410, "total_steps": 40000, "loss": 0.1142, "lr": 0.29908247107983527, "epoch": 0.06889306916180099, "percentage": 3.52, "elapsed_time": "1:29:04", "remaining_time": "1 day, 16:37:52", "throughput": 334.35, "total_tokens": 1786912} {"current_steps": 1415, "total_steps": 40000, "loss": 0.101, "lr": 0.29907595431600253, "epoch": 0.06913737082549533, "percentage": 3.54, "elapsed_time": "1:29:07", "remaining_time": "1 day, 16:30:20", "throughput": 335.34, "total_tokens": 1793248} {"current_steps": 1420, "total_steps": 40000, "loss": 0.137, "lr": 0.29906941456278424, "epoch": 0.06938167248918965, "percentage": 3.55, "elapsed_time": "1:29:10", "remaining_time": "1 day, 16:22:50", "throughput": 336.28, "total_tokens": 1799296} {"current_steps": 1425, "total_steps": 40000, "loss": 0.1311, "lr": 0.2990628518211889, "epoch": 0.06962597415288398, "percentage": 3.56, "elapsed_time": "1:29:13", "remaining_time": "1 day, 16:15:23", "throughput": 337.26, "total_tokens": 1805536} {"current_steps": 1430, "total_steps": 40000, "loss": 0.1254, "lr": 0.2990562660922286, "epoch": 0.06987027581657831, "percentage": 3.57, "elapsed_time": "1:29:16", "remaining_time": "1 day, 16:07:58", "throughput": 338.16, "total_tokens": 1811392} {"current_steps": 1435, "total_steps": 40000, "loss": 0.1222, "lr": 0.2990496573769189, "epoch": 0.07011457748027264, "percentage": 3.59, "elapsed_time": "1:29:19", "remaining_time": "1 day, 16:00:38", "throughput": 339.14, "total_tokens": 1817696} {"current_steps": 1440, "total_steps": 40000, "loss": 0.1473, "lr": 0.29904302567627894, "epoch": 0.07035887914396698, "percentage": 3.6, "elapsed_time": "1:29:22", "remaining_time": "1 day, 15:53:22", "throughput": 340.12, "total_tokens": 1823968} {"current_steps": 1445, "total_steps": 40000, "loss": 0.1155, "lr": 0.2990363709913314, "epoch": 0.0706031808076613, "percentage": 3.61, "elapsed_time": "1:29:25", "remaining_time": "1 day, 15:46:11", "throughput": 341.18, "total_tokens": 1830720} {"current_steps": 1450, "total_steps": 40000, "loss": 0.1166, "lr": 0.29902969332310264, "epoch": 0.07084748247135562, "percentage": 3.62, "elapsed_time": "1:29:29", "remaining_time": "1 day, 15:39:03", "throughput": 342.2, "total_tokens": 1837280} {"current_steps": 1455, "total_steps": 40000, "loss": 0.1136, "lr": 0.2990229926726223, "epoch": 0.07109178413504996, "percentage": 3.64, "elapsed_time": "1:29:32", "remaining_time": "1 day, 15:32:00", "throughput": 343.31, "total_tokens": 1844352} {"current_steps": 1460, "total_steps": 40000, "loss": 0.1089, "lr": 0.29901626904092365, "epoch": 0.07133608579874429, "percentage": 3.65, "elapsed_time": "1:29:35", "remaining_time": "1 day, 15:24:52", "throughput": 344.14, "total_tokens": 1849824} {"current_steps": 1465, "total_steps": 40000, "loss": 0.1028, "lr": 0.2990095224290438, "epoch": 0.07158038746243862, "percentage": 3.66, "elapsed_time": "1:29:38", "remaining_time": "1 day, 15:17:52", "throughput": 345.17, "total_tokens": 1856480} {"current_steps": 1470, "total_steps": 40000, "loss": 0.1264, "lr": 0.29900275283802297, "epoch": 0.07182468912613295, "percentage": 3.67, "elapsed_time": "1:29:41", "remaining_time": "1 day, 15:10:55", "throughput": 346.19, "total_tokens": 1863040} {"current_steps": 1475, "total_steps": 40000, "loss": 0.1225, "lr": 0.2989959602689051, "epoch": 0.07206899078982727, "percentage": 3.69, "elapsed_time": "1:29:44", "remaining_time": "1 day, 15:04:01", "throughput": 347.23, "total_tokens": 1869728} {"current_steps": 1480, "total_steps": 40000, "loss": 0.1233, "lr": 0.2989891447227379, "epoch": 0.07231329245352161, "percentage": 3.7, "elapsed_time": "1:29:47", "remaining_time": "1 day, 14:57:06", "throughput": 348.17, "total_tokens": 1875840} {"current_steps": 1485, "total_steps": 40000, "loss": 0.1131, "lr": 0.29898230620057215, "epoch": 0.07255759411721593, "percentage": 3.71, "elapsed_time": "1:29:50", "remaining_time": "1 day, 14:50:16", "throughput": 349.15, "total_tokens": 1882208} {"current_steps": 1490, "total_steps": 40000, "loss": 0.1081, "lr": 0.2989754447034626, "epoch": 0.07280189578091027, "percentage": 3.72, "elapsed_time": "1:29:53", "remaining_time": "1 day, 14:43:26", "throughput": 350.13, "total_tokens": 1888544} {"current_steps": 1495, "total_steps": 40000, "loss": 0.0986, "lr": 0.2989685602324673, "epoch": 0.0730461974446046, "percentage": 3.74, "elapsed_time": "1:29:56", "remaining_time": "1 day, 14:36:40", "throughput": 351.04, "total_tokens": 1894496} {"current_steps": 1500, "total_steps": 40000, "loss": 0.0971, "lr": 0.298961652788648, "epoch": 0.07329049910829893, "percentage": 3.75, "elapsed_time": "1:30:00", "remaining_time": "1 day, 14:30:01", "throughput": 352.11, "total_tokens": 1901408} {"current_steps": 1505, "total_steps": 40000, "loss": 0.0832, "lr": 0.29895472237306986, "epoch": 0.07353480077199326, "percentage": 3.76, "elapsed_time": "1:30:03", "remaining_time": "1 day, 14:23:20", "throughput": 353.04, "total_tokens": 1907520} {"current_steps": 1510, "total_steps": 40000, "loss": 0.1203, "lr": 0.29894776898680164, "epoch": 0.07377910243568758, "percentage": 3.77, "elapsed_time": "1:30:06", "remaining_time": "1 day, 14:16:44", "throughput": 354.06, "total_tokens": 1914144} {"current_steps": 1515, "total_steps": 40000, "loss": 0.1071, "lr": 0.29894079263091566, "epoch": 0.07402340409938192, "percentage": 3.79, "elapsed_time": "1:30:09", "remaining_time": "1 day, 14:10:09", "throughput": 355.01, "total_tokens": 1920352} {"current_steps": 1520, "total_steps": 40000, "loss": 0.0968, "lr": 0.2989337933064877, "epoch": 0.07426770576307624, "percentage": 3.8, "elapsed_time": "1:30:12", "remaining_time": "1 day, 14:03:40", "throughput": 356.02, "total_tokens": 1926944} {"current_steps": 1525, "total_steps": 40000, "loss": 0.0879, "lr": 0.29892677101459725, "epoch": 0.07451200742677058, "percentage": 3.81, "elapsed_time": "1:30:15", "remaining_time": "1 day, 13:57:11", "throughput": 356.99, "total_tokens": 1933280} {"current_steps": 1530, "total_steps": 40000, "loss": 0.1003, "lr": 0.2989197257563272, "epoch": 0.0747563090904649, "percentage": 3.82, "elapsed_time": "1:30:18", "remaining_time": "1 day, 13:50:44", "throughput": 357.94, "total_tokens": 1939520} {"current_steps": 1535, "total_steps": 40000, "loss": 0.0799, "lr": 0.2989126575327639, "epoch": 0.07500061075415923, "percentage": 3.84, "elapsed_time": "1:30:21", "remaining_time": "1 day, 13:44:19", "throughput": 358.89, "total_tokens": 1945792} {"current_steps": 1540, "total_steps": 40000, "loss": 0.1791, "lr": 0.29890556634499754, "epoch": 0.07524491241785357, "percentage": 3.85, "elapsed_time": "1:30:24", "remaining_time": "1 day, 13:37:58", "throughput": 359.89, "total_tokens": 1952320} {"current_steps": 1545, "total_steps": 40000, "loss": 0.1092, "lr": 0.2988984521941216, "epoch": 0.07548921408154789, "percentage": 3.86, "elapsed_time": "1:30:27", "remaining_time": "1 day, 13:31:40", "throughput": 360.95, "total_tokens": 1959200} {"current_steps": 1550, "total_steps": 40000, "loss": 0.096, "lr": 0.29889131508123307, "epoch": 0.07573351574524223, "percentage": 3.88, "elapsed_time": "1:30:31", "remaining_time": "1 day, 13:25:24", "throughput": 361.9, "total_tokens": 1965504} {"current_steps": 1555, "total_steps": 40000, "loss": 0.1167, "lr": 0.2988841550074327, "epoch": 0.07597781740893655, "percentage": 3.89, "elapsed_time": "1:30:34", "remaining_time": "1 day, 13:19:09", "throughput": 362.85, "total_tokens": 1971776} {"current_steps": 1560, "total_steps": 40000, "loss": 0.0925, "lr": 0.2988769719738246, "epoch": 0.07622211907263088, "percentage": 3.9, "elapsed_time": "1:30:37", "remaining_time": "1 day, 13:13:00", "throughput": 363.88, "total_tokens": 1978528} {"current_steps": 1565, "total_steps": 40000, "loss": 0.1082, "lr": 0.29886976598151666, "epoch": 0.07646642073632522, "percentage": 3.91, "elapsed_time": "1:30:40", "remaining_time": "1 day, 13:06:51", "throughput": 364.83, "total_tokens": 1984832} {"current_steps": 1570, "total_steps": 40000, "loss": 0.1133, "lr": 0.29886253703161986, "epoch": 0.07671072240001954, "percentage": 3.92, "elapsed_time": "1:30:43", "remaining_time": "1 day, 13:00:41", "throughput": 365.74, "total_tokens": 1990848} {"current_steps": 1575, "total_steps": 40000, "loss": 0.0978, "lr": 0.29885528512524917, "epoch": 0.07695502406371388, "percentage": 3.94, "elapsed_time": "1:30:46", "remaining_time": "1 day, 12:54:33", "throughput": 366.62, "total_tokens": 1996736} {"current_steps": 1580, "total_steps": 40000, "loss": 0.0882, "lr": 0.29884801026352287, "epoch": 0.0771993257274082, "percentage": 3.95, "elapsed_time": "1:30:49", "remaining_time": "1 day, 12:48:30", "throughput": 367.57, "total_tokens": 2003040} {"current_steps": 1585, "total_steps": 40000, "loss": 0.1148, "lr": 0.2988407124475629, "epoch": 0.07744362739110254, "percentage": 3.96, "elapsed_time": "1:30:52", "remaining_time": "1 day, 12:42:30", "throughput": 368.49, "total_tokens": 2009216} {"current_steps": 1590, "total_steps": 40000, "loss": 0.1015, "lr": 0.2988333916784945, "epoch": 0.07768792905479686, "percentage": 3.98, "elapsed_time": "1:30:55", "remaining_time": "1 day, 12:36:34", "throughput": 369.48, "total_tokens": 2015744} {"current_steps": 1595, "total_steps": 40000, "loss": 0.1031, "lr": 0.2988260479574468, "epoch": 0.07793223071849119, "percentage": 3.99, "elapsed_time": "1:30:58", "remaining_time": "1 day, 12:30:37", "throughput": 370.4, "total_tokens": 2021920} {"current_steps": 1600, "total_steps": 40000, "loss": 0.0713, "lr": 0.2988186812855523, "epoch": 0.07817653238218553, "percentage": 4.0, "elapsed_time": "1:31:01", "remaining_time": "1 day, 12:24:45", "throughput": 371.39, "total_tokens": 2028480} {"current_steps": 1600, "total_steps": 40000, "eval_loss": 0.10532558709383011, "epoch": 0.07817653238218553, "percentage": 4.0, "elapsed_time": "1:41:41", "remaining_time": "1 day, 16:40:25", "throughput": 332.48, "total_tokens": 2028480} {"current_steps": 1605, "total_steps": 40000, "loss": 0.0972, "lr": 0.29881129166394693, "epoch": 0.07842083404587985, "percentage": 4.01, "elapsed_time": "1:41:44", "remaining_time": "1 day, 16:33:59", "throughput": 333.31, "total_tokens": 2034784} {"current_steps": 1610, "total_steps": 40000, "loss": 0.1036, "lr": 0.29880387909377026, "epoch": 0.07866513570957419, "percentage": 4.03, "elapsed_time": "1:41:47", "remaining_time": "1 day, 16:27:20", "throughput": 334.17, "total_tokens": 2041056} {"current_steps": 1615, "total_steps": 40000, "loss": 0.0995, "lr": 0.2987964435761655, "epoch": 0.07890943737326851, "percentage": 4.04, "elapsed_time": "1:41:50", "remaining_time": "1 day, 16:20:43", "throughput": 335.04, "total_tokens": 2047424} {"current_steps": 1620, "total_steps": 40000, "loss": 0.1021, "lr": 0.29878898511227925, "epoch": 0.07915373903696284, "percentage": 4.05, "elapsed_time": "1:41:53", "remaining_time": "1 day, 16:14:07", "throughput": 335.9, "total_tokens": 2053664} {"current_steps": 1625, "total_steps": 40000, "loss": 0.1033, "lr": 0.2987815037032617, "epoch": 0.07939804070065717, "percentage": 4.06, "elapsed_time": "1:41:56", "remaining_time": "1 day, 16:07:34", "throughput": 336.72, "total_tokens": 2059712} {"current_steps": 1630, "total_steps": 40000, "loss": 0.0858, "lr": 0.29877399935026655, "epoch": 0.0796423423643515, "percentage": 4.08, "elapsed_time": "1:41:59", "remaining_time": "1 day, 16:01:03", "throughput": 337.54, "total_tokens": 2065728} {"current_steps": 1635, "total_steps": 40000, "loss": 0.1168, "lr": 0.2987664720544511, "epoch": 0.07988664402804584, "percentage": 4.09, "elapsed_time": "1:42:03", "remaining_time": "1 day, 15:54:35", "throughput": 338.4, "total_tokens": 2072000} {"current_steps": 1640, "total_steps": 40000, "loss": 0.0702, "lr": 0.2987589218169761, "epoch": 0.08013094569174016, "percentage": 4.1, "elapsed_time": "1:42:06", "remaining_time": "1 day, 15:48:11", "throughput": 339.3, "total_tokens": 2078624} {"current_steps": 1645, "total_steps": 40000, "loss": 0.0829, "lr": 0.29875134863900604, "epoch": 0.08037524735543448, "percentage": 4.11, "elapsed_time": "1:42:09", "remaining_time": "1 day, 15:41:50", "throughput": 340.2, "total_tokens": 2085152} {"current_steps": 1650, "total_steps": 40000, "loss": 0.0804, "lr": 0.29874375252170865, "epoch": 0.08061954901912882, "percentage": 4.12, "elapsed_time": "1:42:12", "remaining_time": "1 day, 15:35:27", "throughput": 340.98, "total_tokens": 2090976} {"current_steps": 1655, "total_steps": 40000, "loss": 0.1094, "lr": 0.2987361334662553, "epoch": 0.08086385068282315, "percentage": 4.14, "elapsed_time": "1:42:15", "remaining_time": "1 day, 15:29:13", "throughput": 341.93, "total_tokens": 2097888} {"current_steps": 1660, "total_steps": 40000, "loss": 0.0935, "lr": 0.29872849147382113, "epoch": 0.08110815234651748, "percentage": 4.15, "elapsed_time": "1:42:18", "remaining_time": "1 day, 15:22:58", "throughput": 342.85, "total_tokens": 2104576} {"current_steps": 1665, "total_steps": 40000, "loss": 0.0991, "lr": 0.2987208265455845, "epoch": 0.08135245401021181, "percentage": 4.16, "elapsed_time": "1:42:21", "remaining_time": "1 day, 15:16:43", "throughput": 343.65, "total_tokens": 2110528} {"current_steps": 1670, "total_steps": 40000, "loss": 0.1139, "lr": 0.29871313868272753, "epoch": 0.08159675567390615, "percentage": 4.17, "elapsed_time": "1:42:24", "remaining_time": "1 day, 15:10:33", "throughput": 344.57, "total_tokens": 2117280} {"current_steps": 1675, "total_steps": 40000, "loss": 0.1261, "lr": 0.29870542788643567, "epoch": 0.08184105733760047, "percentage": 4.19, "elapsed_time": "1:42:27", "remaining_time": "1 day, 15:04:26", "throughput": 345.44, "total_tokens": 2123712} {"current_steps": 1680, "total_steps": 40000, "loss": 0.1138, "lr": 0.2986976941578981, "epoch": 0.0820853590012948, "percentage": 4.2, "elapsed_time": "1:42:30", "remaining_time": "1 day, 14:58:20", "throughput": 346.28, "total_tokens": 2129984} {"current_steps": 1685, "total_steps": 40000, "loss": 0.1111, "lr": 0.29868993749830747, "epoch": 0.08232966066498913, "percentage": 4.21, "elapsed_time": "1:42:34", "remaining_time": "1 day, 14:52:16", "throughput": 347.12, "total_tokens": 2136224} {"current_steps": 1690, "total_steps": 40000, "loss": 0.0755, "lr": 0.2986821579088598, "epoch": 0.08257396232868346, "percentage": 4.23, "elapsed_time": "1:42:37", "remaining_time": "1 day, 14:46:15", "throughput": 347.99, "total_tokens": 2142656} {"current_steps": 1695, "total_steps": 40000, "loss": 0.1068, "lr": 0.29867435539075504, "epoch": 0.0828182639923778, "percentage": 4.24, "elapsed_time": "1:42:40", "remaining_time": "1 day, 14:40:15", "throughput": 348.83, "total_tokens": 2148928} {"current_steps": 1700, "total_steps": 40000, "loss": 0.0826, "lr": 0.2986665299451963, "epoch": 0.08306256565607212, "percentage": 4.25, "elapsed_time": "1:42:43", "remaining_time": "1 day, 14:34:17", "throughput": 349.67, "total_tokens": 2155136} {"current_steps": 1705, "total_steps": 40000, "loss": 0.1112, "lr": 0.29865868157339037, "epoch": 0.08330686731976644, "percentage": 4.26, "elapsed_time": "1:42:46", "remaining_time": "1 day, 14:28:20", "throughput": 350.48, "total_tokens": 2161216} {"current_steps": 1710, "total_steps": 40000, "loss": 0.0642, "lr": 0.2986508102765476, "epoch": 0.08355116898346078, "percentage": 4.28, "elapsed_time": "1:42:49", "remaining_time": "1 day, 14:22:29", "throughput": 351.41, "total_tokens": 2168096} {"current_steps": 1715, "total_steps": 40000, "loss": 0.0848, "lr": 0.2986429160558818, "epoch": 0.0837954706471551, "percentage": 4.29, "elapsed_time": "1:42:52", "remaining_time": "1 day, 14:16:36", "throughput": 352.24, "total_tokens": 2174272} {"current_steps": 1720, "total_steps": 40000, "loss": 0.0723, "lr": 0.2986349989126104, "epoch": 0.08403977231084944, "percentage": 4.3, "elapsed_time": "1:42:55", "remaining_time": "1 day, 14:10:49", "throughput": 353.18, "total_tokens": 2181184} {"current_steps": 1725, "total_steps": 40000, "loss": 0.0924, "lr": 0.29862705884795426, "epoch": 0.08428407397454377, "percentage": 4.31, "elapsed_time": "1:42:58", "remaining_time": "1 day, 14:05:01", "throughput": 354.04, "total_tokens": 2187584} {"current_steps": 1730, "total_steps": 40000, "loss": 0.1107, "lr": 0.2986190958631379, "epoch": 0.08452837563823809, "percentage": 4.32, "elapsed_time": "1:43:01", "remaining_time": "1 day, 13:59:14", "throughput": 354.87, "total_tokens": 2193824} {"current_steps": 1735, "total_steps": 40000, "loss": 0.1064, "lr": 0.29861110995938933, "epoch": 0.08477267730193243, "percentage": 4.34, "elapsed_time": "1:43:05", "remaining_time": "1 day, 13:53:30", "throughput": 355.75, "total_tokens": 2200352} {"current_steps": 1740, "total_steps": 40000, "loss": 0.1365, "lr": 0.29860310113794, "epoch": 0.08501697896562675, "percentage": 4.35, "elapsed_time": "1:43:08", "remaining_time": "1 day, 13:47:47", "throughput": 356.58, "total_tokens": 2206560} {"current_steps": 1745, "total_steps": 40000, "loss": 0.1001, "lr": 0.29859506940002506, "epoch": 0.08526128062932109, "percentage": 4.36, "elapsed_time": "1:43:11", "remaining_time": "1 day, 13:42:07", "throughput": 357.46, "total_tokens": 2213088} {"current_steps": 1750, "total_steps": 40000, "loss": 0.106, "lr": 0.298587014746883, "epoch": 0.08550558229301541, "percentage": 4.38, "elapsed_time": "1:43:14", "remaining_time": "1 day, 13:36:29", "throughput": 358.29, "total_tokens": 2219360} {"current_steps": 1755, "total_steps": 40000, "loss": 0.0731, "lr": 0.298578937179756, "epoch": 0.08574988395670975, "percentage": 4.39, "elapsed_time": "1:43:17", "remaining_time": "1 day, 13:30:53", "throughput": 359.1, "total_tokens": 2225504} {"current_steps": 1760, "total_steps": 40000, "loss": 0.0981, "lr": 0.29857083669988976, "epoch": 0.08599418562040408, "percentage": 4.4, "elapsed_time": "1:43:20", "remaining_time": "1 day, 13:25:17", "throughput": 359.87, "total_tokens": 2231360} {"current_steps": 1765, "total_steps": 40000, "loss": 0.046, "lr": 0.29856271330853346, "epoch": 0.0862384872840984, "percentage": 4.41, "elapsed_time": "1:43:23", "remaining_time": "1 day, 13:19:44", "throughput": 360.72, "total_tokens": 2237728} {"current_steps": 1770, "total_steps": 40000, "loss": 0.0967, "lr": 0.2985545670069398, "epoch": 0.08648278894779274, "percentage": 4.42, "elapsed_time": "1:43:26", "remaining_time": "1 day, 13:14:14", "throughput": 361.52, "total_tokens": 2243808} {"current_steps": 1775, "total_steps": 40000, "loss": 0.1534, "lr": 0.29854639779636505, "epoch": 0.08672709061148706, "percentage": 4.44, "elapsed_time": "1:43:29", "remaining_time": "1 day, 13:08:45", "throughput": 362.38, "total_tokens": 2250272} {"current_steps": 1780, "total_steps": 40000, "loss": 0.1203, "lr": 0.298538205678069, "epoch": 0.0869713922751814, "percentage": 4.45, "elapsed_time": "1:43:32", "remaining_time": "1 day, 13:03:18", "throughput": 363.19, "total_tokens": 2256416} {"current_steps": 1785, "total_steps": 40000, "loss": 0.1966, "lr": 0.298529990653315, "epoch": 0.08721569393887572, "percentage": 4.46, "elapsed_time": "1:43:35", "remaining_time": "1 day, 12:57:53", "throughput": 364.01, "total_tokens": 2262592} {"current_steps": 1790, "total_steps": 40000, "loss": 0.1667, "lr": 0.29852175272336984, "epoch": 0.08745999560257005, "percentage": 4.47, "elapsed_time": "1:43:38", "remaining_time": "1 day, 12:52:29", "throughput": 364.8, "total_tokens": 2268640} {"current_steps": 1795, "total_steps": 40000, "loss": 0.1397, "lr": 0.29851349188950405, "epoch": 0.08770429726626439, "percentage": 4.49, "elapsed_time": "1:43:41", "remaining_time": "1 day, 12:47:07", "throughput": 365.61, "total_tokens": 2274784} {"current_steps": 1800, "total_steps": 40000, "loss": 0.1344, "lr": 0.2985052081529914, "epoch": 0.08794859892995871, "percentage": 4.5, "elapsed_time": "1:43:44", "remaining_time": "1 day, 12:41:46", "throughput": 366.42, "total_tokens": 2280960} {"current_steps": 1800, "total_steps": 40000, "eval_loss": 0.1333623230457306, "epoch": 0.08794859892995871, "percentage": 4.5, "elapsed_time": "1:54:23", "remaining_time": "1 day, 16:27:37", "throughput": 332.33, "total_tokens": 2280960} {"current_steps": 1805, "total_steps": 40000, "loss": 0.1421, "lr": 0.29849690151510944, "epoch": 0.08819290059365305, "percentage": 4.51, "elapsed_time": "1:54:27", "remaining_time": "1 day, 16:21:52", "throughput": 333.04, "total_tokens": 2287008} {"current_steps": 1810, "total_steps": 40000, "loss": 0.191, "lr": 0.2984885719771392, "epoch": 0.08843720225734737, "percentage": 4.52, "elapsed_time": "1:54:30", "remaining_time": "1 day, 16:15:56", "throughput": 333.77, "total_tokens": 2293024} {"current_steps": 1815, "total_steps": 40000, "loss": 0.1444, "lr": 0.2984802195403651, "epoch": 0.0886815039210417, "percentage": 4.54, "elapsed_time": "1:54:33", "remaining_time": "1 day, 16:10:03", "throughput": 334.55, "total_tokens": 2299424} {"current_steps": 1820, "total_steps": 40000, "loss": 0.109, "lr": 0.2984718442060752, "epoch": 0.08892580558473603, "percentage": 4.55, "elapsed_time": "1:54:36", "remaining_time": "1 day, 16:04:12", "throughput": 335.33, "total_tokens": 2305856} {"current_steps": 1825, "total_steps": 40000, "loss": 0.1076, "lr": 0.2984634459755611, "epoch": 0.08917010724843036, "percentage": 4.56, "elapsed_time": "1:54:39", "remaining_time": "1 day, 15:58:24", "throughput": 336.13, "total_tokens": 2312416} {"current_steps": 1830, "total_steps": 40000, "loss": 0.1247, "lr": 0.29845502485011793, "epoch": 0.0894144089121247, "percentage": 4.58, "elapsed_time": "1:54:42", "remaining_time": "1 day, 15:52:36", "throughput": 336.87, "total_tokens": 2318560} {"current_steps": 1835, "total_steps": 40000, "loss": 0.14, "lr": 0.2984465808310444, "epoch": 0.08965871057581902, "percentage": 4.59, "elapsed_time": "1:54:45", "remaining_time": "1 day, 15:46:50", "throughput": 337.67, "total_tokens": 2325056} {"current_steps": 1840, "total_steps": 40000, "loss": 0.1167, "lr": 0.29843811391964253, "epoch": 0.08990301223951336, "percentage": 4.6, "elapsed_time": "1:54:48", "remaining_time": "1 day, 15:41:05", "throughput": 338.46, "total_tokens": 2331584} {"current_steps": 1845, "total_steps": 40000, "loss": 0.1176, "lr": 0.2984296241172182, "epoch": 0.09014731390320768, "percentage": 4.61, "elapsed_time": "1:54:51", "remaining_time": "1 day, 15:35:24", "throughput": 339.27, "total_tokens": 2338208} {"current_steps": 1850, "total_steps": 40000, "loss": 0.1032, "lr": 0.29842111142508043, "epoch": 0.090391615566902, "percentage": 4.62, "elapsed_time": "1:54:54", "remaining_time": "1 day, 15:29:43", "throughput": 340.01, "total_tokens": 2344288} {"current_steps": 1855, "total_steps": 40000, "loss": 0.1302, "lr": 0.29841257584454217, "epoch": 0.09063591723059634, "percentage": 4.64, "elapsed_time": "1:54:57", "remaining_time": "1 day, 15:24:01", "throughput": 340.72, "total_tokens": 2350240} {"current_steps": 1860, "total_steps": 40000, "loss": 0.1049, "lr": 0.29840401737691963, "epoch": 0.09088021889429067, "percentage": 4.65, "elapsed_time": "1:55:00", "remaining_time": "1 day, 15:18:27", "throughput": 341.54, "total_tokens": 2356992} {"current_steps": 1865, "total_steps": 40000, "loss": 0.1149, "lr": 0.29839543602353263, "epoch": 0.091124520557985, "percentage": 4.66, "elapsed_time": "1:55:04", "remaining_time": "1 day, 15:12:51", "throughput": 342.27, "total_tokens": 2363040} {"current_steps": 1870, "total_steps": 40000, "loss": 0.0978, "lr": 0.2983868317857046, "epoch": 0.09136882222167933, "percentage": 4.67, "elapsed_time": "1:55:07", "remaining_time": "1 day, 15:07:18", "throughput": 343.02, "total_tokens": 2369280} {"current_steps": 1875, "total_steps": 40000, "loss": 0.0939, "lr": 0.2983782046647623, "epoch": 0.09161312388537365, "percentage": 4.69, "elapsed_time": "1:55:10", "remaining_time": "1 day, 15:01:48", "throughput": 343.83, "total_tokens": 2375936} {"current_steps": 1880, "total_steps": 40000, "loss": 0.1344, "lr": 0.2983695546620362, "epoch": 0.09185742554906799, "percentage": 4.7, "elapsed_time": "1:55:13", "remaining_time": "1 day, 14:56:17", "throughput": 344.56, "total_tokens": 2382016} {"current_steps": 1885, "total_steps": 40000, "loss": 0.1218, "lr": 0.2983608817788603, "epoch": 0.09210172721276232, "percentage": 4.71, "elapsed_time": "1:55:16", "remaining_time": "1 day, 14:50:49", "throughput": 345.29, "total_tokens": 2388160} {"current_steps": 1890, "total_steps": 40000, "loss": 0.1091, "lr": 0.29835218601657193, "epoch": 0.09234602887645665, "percentage": 4.72, "elapsed_time": "1:55:19", "remaining_time": "1 day, 14:45:24", "throughput": 346.08, "total_tokens": 2394688} {"current_steps": 1895, "total_steps": 40000, "loss": 0.0905, "lr": 0.29834346737651224, "epoch": 0.09259033054015098, "percentage": 4.74, "elapsed_time": "1:55:22", "remaining_time": "1 day, 14:40:02", "throughput": 346.89, "total_tokens": 2401408} {"current_steps": 1900, "total_steps": 40000, "loss": 0.0793, "lr": 0.29833472586002563, "epoch": 0.0928346322038453, "percentage": 4.75, "elapsed_time": "1:55:25", "remaining_time": "1 day, 14:34:40", "throughput": 347.69, "total_tokens": 2408000} {"current_steps": 1905, "total_steps": 40000, "loss": 0.1061, "lr": 0.29832596146846024, "epoch": 0.09307893386753964, "percentage": 4.76, "elapsed_time": "1:55:28", "remaining_time": "1 day, 14:29:21", "throughput": 348.48, "total_tokens": 2414624} {"current_steps": 1910, "total_steps": 40000, "loss": 0.0758, "lr": 0.2983171742031676, "epoch": 0.09332323553123396, "percentage": 4.78, "elapsed_time": "1:55:31", "remaining_time": "1 day, 14:24:00", "throughput": 349.19, "total_tokens": 2420576} {"current_steps": 1915, "total_steps": 40000, "loss": 0.0761, "lr": 0.2983083640655028, "epoch": 0.0935675371949283, "percentage": 4.79, "elapsed_time": "1:55:34", "remaining_time": "1 day, 14:18:40", "throughput": 349.9, "total_tokens": 2426528} {"current_steps": 1920, "total_steps": 40000, "loss": 0.0793, "lr": 0.29829953105682455, "epoch": 0.09381183885862263, "percentage": 4.8, "elapsed_time": "1:55:37", "remaining_time": "1 day, 14:13:22", "throughput": 350.6, "total_tokens": 2432416} {"current_steps": 1925, "total_steps": 40000, "loss": 0.0511, "lr": 0.29829067517849495, "epoch": 0.09405614052231696, "percentage": 4.81, "elapsed_time": "1:55:41", "remaining_time": "1 day, 14:08:08", "throughput": 351.37, "total_tokens": 2438880} {"current_steps": 1930, "total_steps": 40000, "loss": 0.0811, "lr": 0.2982817964318797, "epoch": 0.09430044218601129, "percentage": 4.83, "elapsed_time": "1:55:44", "remaining_time": "1 day, 14:02:56", "throughput": 352.14, "total_tokens": 2445312} {"current_steps": 1935, "total_steps": 40000, "loss": 0.0792, "lr": 0.298272894818348, "epoch": 0.09454474384970561, "percentage": 4.84, "elapsed_time": "1:55:47", "remaining_time": "1 day, 13:57:47", "throughput": 352.94, "total_tokens": 2451968} {"current_steps": 1940, "total_steps": 40000, "loss": 0.1567, "lr": 0.2982639703392726, "epoch": 0.09478904551339995, "percentage": 4.85, "elapsed_time": "1:55:50", "remaining_time": "1 day, 13:52:39", "throughput": 353.78, "total_tokens": 2458976} {"current_steps": 1945, "total_steps": 40000, "loss": 0.0942, "lr": 0.29825502299602974, "epoch": 0.09503334717709427, "percentage": 4.86, "elapsed_time": "1:55:53", "remaining_time": "1 day, 13:47:32", "throughput": 354.57, "total_tokens": 2465536} {"current_steps": 1950, "total_steps": 40000, "loss": 0.0964, "lr": 0.2982460527899993, "epoch": 0.09527764884078861, "percentage": 4.88, "elapsed_time": "1:55:56", "remaining_time": "1 day, 13:42:27", "throughput": 355.35, "total_tokens": 2472096} {"current_steps": 1955, "total_steps": 40000, "loss": 0.1039, "lr": 0.29823705972256453, "epoch": 0.09552195050448294, "percentage": 4.89, "elapsed_time": "1:55:59", "remaining_time": "1 day, 13:37:22", "throughput": 356.05, "total_tokens": 2478080} {"current_steps": 1960, "total_steps": 40000, "loss": 0.0841, "lr": 0.2982280437951123, "epoch": 0.09576625216817726, "percentage": 4.9, "elapsed_time": "1:56:02", "remaining_time": "1 day, 13:32:17", "throughput": 356.8, "total_tokens": 2484384} {"current_steps": 1965, "total_steps": 40000, "loss": 0.0766, "lr": 0.298219005009033, "epoch": 0.0960105538318716, "percentage": 4.91, "elapsed_time": "1:56:06", "remaining_time": "1 day, 13:27:17", "throughput": 357.62, "total_tokens": 2491200} {"current_steps": 1970, "total_steps": 40000, "loss": 0.0601, "lr": 0.29820994336572043, "epoch": 0.09625485549556592, "percentage": 4.92, "elapsed_time": "1:56:09", "remaining_time": "1 day, 13:22:18", "throughput": 358.39, "total_tokens": 2497696} {"current_steps": 1975, "total_steps": 40000, "loss": 0.0861, "lr": 0.2982008588665721, "epoch": 0.09649915715926026, "percentage": 4.94, "elapsed_time": "1:56:12", "remaining_time": "1 day, 13:17:18", "throughput": 359.08, "total_tokens": 2503616} {"current_steps": 1980, "total_steps": 40000, "loss": 0.0591, "lr": 0.2981917515129889, "epoch": 0.09674345882295458, "percentage": 4.95, "elapsed_time": "1:56:15", "remaining_time": "1 day, 13:12:19", "throughput": 359.82, "total_tokens": 2509856} {"current_steps": 1985, "total_steps": 40000, "loss": 0.0851, "lr": 0.2981826213063753, "epoch": 0.09698776048664891, "percentage": 4.96, "elapsed_time": "1:56:18", "remaining_time": "1 day, 13:07:25", "throughput": 360.59, "total_tokens": 2516384} {"current_steps": 1990, "total_steps": 40000, "loss": 0.0872, "lr": 0.2981734682481394, "epoch": 0.09723206215034325, "percentage": 4.98, "elapsed_time": "1:56:21", "remaining_time": "1 day, 13:02:32", "throughput": 361.4, "total_tokens": 2523136} {"current_steps": 1995, "total_steps": 40000, "loss": 0.1013, "lr": 0.29816429233969255, "epoch": 0.09747636381403757, "percentage": 4.99, "elapsed_time": "1:56:24", "remaining_time": "1 day, 12:57:39", "throughput": 362.16, "total_tokens": 2529600} {"current_steps": 2000, "total_steps": 40000, "loss": 0.0793, "lr": 0.2981550935824499, "epoch": 0.09772066547773191, "percentage": 5.0, "elapsed_time": "1:56:27", "remaining_time": "1 day, 12:52:51", "throughput": 362.98, "total_tokens": 2536512} {"current_steps": 2000, "total_steps": 40000, "eval_loss": 0.08809199184179306, "epoch": 0.09772066547773191, "percentage": 5.0, "elapsed_time": "2:07:06", "remaining_time": "1 day, 16:15:05", "throughput": 332.59, "total_tokens": 2536512} {"current_steps": 2005, "total_steps": 40000, "loss": 0.0925, "lr": 0.29814587197783, "epoch": 0.09796496714142623, "percentage": 5.01, "elapsed_time": "2:07:10", "remaining_time": "1 day, 16:09:56", "throughput": 333.22, "total_tokens": 2542560} {"current_steps": 2010, "total_steps": 40000, "loss": 0.1063, "lr": 0.29813662752725495, "epoch": 0.09820926880512057, "percentage": 5.03, "elapsed_time": "2:07:13", "remaining_time": "1 day, 16:04:37", "throughput": 333.93, "total_tokens": 2549056} {"current_steps": 2015, "total_steps": 40000, "loss": 0.0916, "lr": 0.29812736023215025, "epoch": 0.0984535704688149, "percentage": 5.04, "elapsed_time": "2:07:16", "remaining_time": "1 day, 15:59:18", "throughput": 334.62, "total_tokens": 2555360} {"current_steps": 2020, "total_steps": 40000, "loss": 0.0661, "lr": 0.29811807009394514, "epoch": 0.09869787213250922, "percentage": 5.05, "elapsed_time": "2:07:19", "remaining_time": "1 day, 15:54:02", "throughput": 335.38, "total_tokens": 2562208} {"current_steps": 2025, "total_steps": 40000, "loss": 0.0738, "lr": 0.2981087571140723, "epoch": 0.09894217379620356, "percentage": 5.06, "elapsed_time": "2:07:22", "remaining_time": "1 day, 15:48:45", "throughput": 336.05, "total_tokens": 2568352} {"current_steps": 2030, "total_steps": 40000, "loss": 0.0838, "lr": 0.2980994212939678, "epoch": 0.09918647545989788, "percentage": 5.08, "elapsed_time": "2:07:25", "remaining_time": "1 day, 15:43:31", "throughput": 336.74, "total_tokens": 2574656} {"current_steps": 2035, "total_steps": 40000, "loss": 0.0577, "lr": 0.2980900626350715, "epoch": 0.09943077712359222, "percentage": 5.09, "elapsed_time": "2:07:28", "remaining_time": "1 day, 15:38:17", "throughput": 337.4, "total_tokens": 2580768} {"current_steps": 2040, "total_steps": 40000, "loss": 0.0741, "lr": 0.29808068113882646, "epoch": 0.09967507878728654, "percentage": 5.1, "elapsed_time": "2:07:31", "remaining_time": "1 day, 15:33:05", "throughput": 338.08, "total_tokens": 2586976} {"current_steps": 2045, "total_steps": 40000, "loss": 0.0712, "lr": 0.2980712768066795, "epoch": 0.09991938045098087, "percentage": 5.11, "elapsed_time": "2:07:35", "remaining_time": "1 day, 15:27:56", "throughput": 338.76, "total_tokens": 2593248} {"current_steps": 2050, "total_steps": 40000, "loss": 0.1215, "lr": 0.2980618496400809, "epoch": 0.1001636821146752, "percentage": 5.12, "elapsed_time": "2:07:38", "remaining_time": "1 day, 15:22:47", "throughput": 339.46, "total_tokens": 2599584} {"current_steps": 2055, "total_steps": 40000, "loss": 0.072, "lr": 0.2980523996404844, "epoch": 0.10040798377836953, "percentage": 5.14, "elapsed_time": "2:07:41", "remaining_time": "1 day, 15:17:40", "throughput": 340.13, "total_tokens": 2605760} {"current_steps": 2060, "total_steps": 40000, "loss": 0.1022, "lr": 0.2980429268093473, "epoch": 0.10065228544206387, "percentage": 5.15, "elapsed_time": "2:07:44", "remaining_time": "1 day, 15:12:34", "throughput": 340.8, "total_tokens": 2611968} {"current_steps": 2065, "total_steps": 40000, "loss": 0.0668, "lr": 0.29803343114813047, "epoch": 0.10089658710575819, "percentage": 5.16, "elapsed_time": "2:07:47", "remaining_time": "1 day, 15:07:29", "throughput": 341.45, "total_tokens": 2617952} {"current_steps": 2070, "total_steps": 40000, "loss": 0.066, "lr": 0.2980239126582983, "epoch": 0.10114088876945251, "percentage": 5.17, "elapsed_time": "2:07:50", "remaining_time": "1 day, 15:02:27", "throughput": 342.13, "total_tokens": 2624224} {"current_steps": 2075, "total_steps": 40000, "loss": 0.1104, "lr": 0.2980143713413186, "epoch": 0.10138519043314685, "percentage": 5.19, "elapsed_time": "2:07:53", "remaining_time": "1 day, 14:57:26", "throughput": 342.82, "total_tokens": 2630560} {"current_steps": 2080, "total_steps": 40000, "loss": 0.0821, "lr": 0.29800480719866274, "epoch": 0.10162949209684118, "percentage": 5.2, "elapsed_time": "2:07:56", "remaining_time": "1 day, 14:52:25", "throughput": 343.49, "total_tokens": 2636768} {"current_steps": 2085, "total_steps": 40000, "loss": 0.0868, "lr": 0.2979952202318057, "epoch": 0.10187379376053551, "percentage": 5.21, "elapsed_time": "2:07:59", "remaining_time": "1 day, 14:47:26", "throughput": 344.15, "total_tokens": 2642848} {"current_steps": 2090, "total_steps": 40000, "loss": 0.0751, "lr": 0.2979856104422259, "epoch": 0.10211809542422984, "percentage": 5.22, "elapsed_time": "2:08:02", "remaining_time": "1 day, 14:42:30", "throughput": 344.85, "total_tokens": 2649280} {"current_steps": 2095, "total_steps": 40000, "loss": 0.082, "lr": 0.2979759778314052, "epoch": 0.10236239708792418, "percentage": 5.24, "elapsed_time": "2:08:05", "remaining_time": "1 day, 14:37:34", "throughput": 345.51, "total_tokens": 2655424} {"current_steps": 2100, "total_steps": 40000, "loss": 0.11, "lr": 0.2979663224008292, "epoch": 0.1026066987516185, "percentage": 5.25, "elapsed_time": "2:08:08", "remaining_time": "1 day, 14:32:38", "throughput": 346.13, "total_tokens": 2661184} {"current_steps": 2105, "total_steps": 40000, "loss": 0.0707, "lr": 0.2979566441519868, "epoch": 0.10285100041531282, "percentage": 5.26, "elapsed_time": "2:08:11", "remaining_time": "1 day, 14:27:45", "throughput": 346.8, "total_tokens": 2667424} {"current_steps": 2110, "total_steps": 40000, "loss": 0.0816, "lr": 0.29794694308637054, "epoch": 0.10309530207900716, "percentage": 5.27, "elapsed_time": "2:08:14", "remaining_time": "1 day, 14:22:54", "throughput": 347.49, "total_tokens": 2673824} {"current_steps": 2115, "total_steps": 40000, "loss": 0.1031, "lr": 0.2979372192054764, "epoch": 0.10333960374270149, "percentage": 5.29, "elapsed_time": "2:08:17", "remaining_time": "1 day, 14:18:05", "throughput": 348.2, "total_tokens": 2680320} {"current_steps": 2120, "total_steps": 40000, "loss": 0.0762, "lr": 0.297927472510804, "epoch": 0.10358390540639582, "percentage": 5.3, "elapsed_time": "2:08:20", "remaining_time": "1 day, 14:13:16", "throughput": 348.85, "total_tokens": 2686432} {"current_steps": 2125, "total_steps": 40000, "loss": 0.0856, "lr": 0.29791770300385634, "epoch": 0.10382820707009015, "percentage": 5.31, "elapsed_time": "2:08:23", "remaining_time": "1 day, 14:08:27", "throughput": 349.51, "total_tokens": 2692512} {"current_steps": 2130, "total_steps": 40000, "loss": 0.093, "lr": 0.29790791068614003, "epoch": 0.10407250873378447, "percentage": 5.33, "elapsed_time": "2:08:26", "remaining_time": "1 day, 14:03:42", "throughput": 350.2, "total_tokens": 2698912} {"current_steps": 2135, "total_steps": 40000, "loss": 0.0967, "lr": 0.2978980955591652, "epoch": 0.10431681039747881, "percentage": 5.34, "elapsed_time": "2:08:30", "remaining_time": "1 day, 13:59:00", "throughput": 350.95, "total_tokens": 2705824} {"current_steps": 2140, "total_steps": 40000, "loss": 0.0546, "lr": 0.2978882576244454, "epoch": 0.10456111206117313, "percentage": 5.35, "elapsed_time": "2:08:33", "remaining_time": "1 day, 13:54:17", "throughput": 351.64, "total_tokens": 2712256} {"current_steps": 2145, "total_steps": 40000, "loss": 0.0841, "lr": 0.2978783968834978, "epoch": 0.10480541372486747, "percentage": 5.36, "elapsed_time": "2:08:36", "remaining_time": "1 day, 13:49:35", "throughput": 352.32, "total_tokens": 2718592} {"current_steps": 2150, "total_steps": 40000, "loss": 0.0538, "lr": 0.29786851333784303, "epoch": 0.1050497153885618, "percentage": 5.38, "elapsed_time": "2:08:39", "remaining_time": "1 day, 13:44:57", "throughput": 353.1, "total_tokens": 2725696} {"current_steps": 2155, "total_steps": 40000, "loss": 0.0859, "lr": 0.2978586069890053, "epoch": 0.10529401705225612, "percentage": 5.39, "elapsed_time": "2:08:42", "remaining_time": "1 day, 13:40:17", "throughput": 353.75, "total_tokens": 2731808} {"current_steps": 2160, "total_steps": 40000, "loss": 0.0994, "lr": 0.29784867783851227, "epoch": 0.10553831871595046, "percentage": 5.4, "elapsed_time": "2:08:45", "remaining_time": "1 day, 13:35:40", "throughput": 354.45, "total_tokens": 2738336} {"current_steps": 2165, "total_steps": 40000, "loss": 0.0956, "lr": 0.2978387258878951, "epoch": 0.10578262037964478, "percentage": 5.41, "elapsed_time": "2:08:48", "remaining_time": "1 day, 13:31:04", "throughput": 355.12, "total_tokens": 2744608} {"current_steps": 2170, "total_steps": 40000, "loss": 0.042, "lr": 0.29782875113868856, "epoch": 0.10602692204333912, "percentage": 5.42, "elapsed_time": "2:08:51", "remaining_time": "1 day, 13:26:31", "throughput": 355.9, "total_tokens": 2751776} {"current_steps": 2175, "total_steps": 40000, "loss": 0.0712, "lr": 0.2978187535924309, "epoch": 0.10627122370703344, "percentage": 5.44, "elapsed_time": "2:08:55", "remaining_time": "1 day, 13:21:58", "throughput": 356.58, "total_tokens": 2758176} {"current_steps": 2180, "total_steps": 40000, "loss": 0.1099, "lr": 0.29780873325066376, "epoch": 0.10651552537072777, "percentage": 5.45, "elapsed_time": "2:08:58", "remaining_time": "1 day, 13:17:27", "throughput": 357.28, "total_tokens": 2764704} {"current_steps": 2185, "total_steps": 40000, "loss": 0.0897, "lr": 0.2977986901149325, "epoch": 0.1067598270344221, "percentage": 5.46, "elapsed_time": "2:09:01", "remaining_time": "1 day, 13:12:55", "throughput": 357.96, "total_tokens": 2771040} {"current_steps": 2190, "total_steps": 40000, "loss": 0.1049, "lr": 0.29778862418678587, "epoch": 0.10700412869811643, "percentage": 5.47, "elapsed_time": "2:09:04", "remaining_time": "1 day, 13:08:24", "throughput": 358.63, "total_tokens": 2777344} {"current_steps": 2195, "total_steps": 40000, "loss": 0.1154, "lr": 0.29777853546777616, "epoch": 0.10724843036181077, "percentage": 5.49, "elapsed_time": "2:09:07", "remaining_time": "1 day, 13:03:58", "throughput": 359.39, "total_tokens": 2784384} {"current_steps": 2200, "total_steps": 40000, "loss": 0.1019, "lr": 0.2977684239594592, "epoch": 0.10749273202550509, "percentage": 5.5, "elapsed_time": "2:09:10", "remaining_time": "1 day, 12:59:30", "throughput": 360.07, "total_tokens": 2790752} {"current_steps": 2200, "total_steps": 40000, "eval_loss": 0.11207126826047897, "epoch": 0.10749273202550509, "percentage": 5.5, "elapsed_time": "2:19:49", "remaining_time": "1 day, 16:02:22", "throughput": 332.66, "total_tokens": 2790752} {"current_steps": 2205, "total_steps": 40000, "loss": 0.088, "lr": 0.29775828966339424, "epoch": 0.10773703368919943, "percentage": 5.51, "elapsed_time": "2:19:53", "remaining_time": "1 day, 15:57:48", "throughput": 333.26, "total_tokens": 2797216} {"current_steps": 2210, "total_steps": 40000, "loss": 0.0671, "lr": 0.29774813258114424, "epoch": 0.10798133535289375, "percentage": 5.53, "elapsed_time": "2:19:56", "remaining_time": "1 day, 15:52:55", "throughput": 333.84, "total_tokens": 2803072} {"current_steps": 2215, "total_steps": 40000, "loss": 0.0783, "lr": 0.29773795271427544, "epoch": 0.10822563701658808, "percentage": 5.54, "elapsed_time": "2:19:59", "remaining_time": "1 day, 15:48:04", "throughput": 334.47, "total_tokens": 2809376} {"current_steps": 2220, "total_steps": 40000, "loss": 0.0901, "lr": 0.2977277500643577, "epoch": 0.10846993868028242, "percentage": 5.55, "elapsed_time": "2:20:02", "remaining_time": "1 day, 15:43:14", "throughput": 335.08, "total_tokens": 2815552} {"current_steps": 2225, "total_steps": 40000, "loss": 0.0638, "lr": 0.29771752463296447, "epoch": 0.10871424034397674, "percentage": 5.56, "elapsed_time": "2:20:05", "remaining_time": "1 day, 15:38:25", "throughput": 335.66, "total_tokens": 2821440} {"current_steps": 2230, "total_steps": 40000, "loss": 0.09, "lr": 0.29770727642167266, "epoch": 0.10895854200767108, "percentage": 5.58, "elapsed_time": "2:20:08", "remaining_time": "1 day, 15:33:38", "throughput": 336.28, "total_tokens": 2827616} {"current_steps": 2235, "total_steps": 40000, "loss": 0.1395, "lr": 0.29769700543206257, "epoch": 0.1092028436713654, "percentage": 5.59, "elapsed_time": "2:20:11", "remaining_time": "1 day, 15:28:53", "throughput": 336.92, "total_tokens": 2834080} {"current_steps": 2240, "total_steps": 40000, "loss": 0.1017, "lr": 0.2976867116657182, "epoch": 0.10944714533505973, "percentage": 5.6, "elapsed_time": "2:20:14", "remaining_time": "1 day, 15:24:08", "throughput": 337.53, "total_tokens": 2840224} {"current_steps": 2245, "total_steps": 40000, "loss": 0.0921, "lr": 0.2976763951242269, "epoch": 0.10969144699875406, "percentage": 5.61, "elapsed_time": "2:20:17", "remaining_time": "1 day, 15:19:24", "throughput": 338.12, "total_tokens": 2846208} {"current_steps": 2250, "total_steps": 40000, "loss": 0.0849, "lr": 0.29766605580917965, "epoch": 0.10993574866244839, "percentage": 5.62, "elapsed_time": "2:20:20", "remaining_time": "1 day, 15:14:43", "throughput": 338.76, "total_tokens": 2852704} {"current_steps": 2255, "total_steps": 40000, "loss": 0.0943, "lr": 0.29765569372217093, "epoch": 0.11018005032614273, "percentage": 5.64, "elapsed_time": "2:20:24", "remaining_time": "1 day, 15:10:04", "throughput": 339.42, "total_tokens": 2859264} {"current_steps": 2260, "total_steps": 40000, "loss": 0.1166, "lr": 0.2976453088647987, "epoch": 0.11042435198983705, "percentage": 5.65, "elapsed_time": "2:20:27", "remaining_time": "1 day, 15:05:26", "throughput": 340.08, "total_tokens": 2865888} {"current_steps": 2265, "total_steps": 40000, "loss": 0.101, "lr": 0.2976349012386644, "epoch": 0.11066865365353137, "percentage": 5.66, "elapsed_time": "2:20:30", "remaining_time": "1 day, 15:00:48", "throughput": 340.67, "total_tokens": 2871968} {"current_steps": 2270, "total_steps": 40000, "loss": 0.0619, "lr": 0.29762447084537297, "epoch": 0.11091295531722571, "percentage": 5.67, "elapsed_time": "2:20:33", "remaining_time": "1 day, 14:56:12", "throughput": 341.31, "total_tokens": 2878432} {"current_steps": 2275, "total_steps": 40000, "loss": 0.087, "lr": 0.29761401768653306, "epoch": 0.11115725698092004, "percentage": 5.69, "elapsed_time": "2:20:36", "remaining_time": "1 day, 14:51:39", "throughput": 342.02, "total_tokens": 2885472} {"current_steps": 2280, "total_steps": 40000, "loss": 0.076, "lr": 0.29760354176375653, "epoch": 0.11140155864461437, "percentage": 5.7, "elapsed_time": "2:20:39", "remaining_time": "1 day, 14:47:03", "throughput": 342.62, "total_tokens": 2891584} {"current_steps": 2285, "total_steps": 40000, "loss": 0.1031, "lr": 0.29759304307865897, "epoch": 0.1116458603083087, "percentage": 5.71, "elapsed_time": "2:20:42", "remaining_time": "1 day, 14:42:31", "throughput": 343.25, "total_tokens": 2897984} {"current_steps": 2290, "total_steps": 40000, "loss": 0.0879, "lr": 0.2975825216328594, "epoch": 0.11189016197200304, "percentage": 5.73, "elapsed_time": "2:20:45", "remaining_time": "1 day, 14:37:59", "throughput": 343.87, "total_tokens": 2904224} {"current_steps": 2295, "total_steps": 40000, "loss": 0.059, "lr": 0.2975719774279804, "epoch": 0.11213446363569736, "percentage": 5.74, "elapsed_time": "2:20:48", "remaining_time": "1 day, 14:33:28", "throughput": 344.49, "total_tokens": 2910592} {"current_steps": 2300, "total_steps": 40000, "loss": 0.0743, "lr": 0.29756141046564794, "epoch": 0.11237876529939168, "percentage": 5.75, "elapsed_time": "2:20:51", "remaining_time": "1 day, 14:28:58", "throughput": 345.09, "total_tokens": 2916640} {"current_steps": 2305, "total_steps": 40000, "loss": 0.1838, "lr": 0.2975508207474916, "epoch": 0.11262306696308602, "percentage": 5.76, "elapsed_time": "2:20:54", "remaining_time": "1 day, 14:24:29", "throughput": 345.68, "total_tokens": 2922688} {"current_steps": 2310, "total_steps": 40000, "loss": 0.1095, "lr": 0.2975402082751445, "epoch": 0.11286736862678035, "percentage": 5.78, "elapsed_time": "2:20:58", "remaining_time": "1 day, 14:20:02", "throughput": 346.29, "total_tokens": 2928992} {"current_steps": 2315, "total_steps": 40000, "loss": 0.0778, "lr": 0.29752957305024313, "epoch": 0.11311167029047468, "percentage": 5.79, "elapsed_time": "2:21:01", "remaining_time": "1 day, 14:15:37", "throughput": 346.97, "total_tokens": 2935776} {"current_steps": 2320, "total_steps": 40000, "loss": 0.1245, "lr": 0.2975189150744277, "epoch": 0.11335597195416901, "percentage": 5.8, "elapsed_time": "2:21:04", "remaining_time": "1 day, 14:11:15", "throughput": 347.65, "total_tokens": 2942656} {"current_steps": 2325, "total_steps": 40000, "loss": 0.0929, "lr": 0.29750823434934165, "epoch": 0.11360027361786333, "percentage": 5.81, "elapsed_time": "2:21:07", "remaining_time": "1 day, 14:06:50", "throughput": 348.22, "total_tokens": 2948544} {"current_steps": 2330, "total_steps": 40000, "loss": 0.1025, "lr": 0.29749753087663217, "epoch": 0.11384457528155767, "percentage": 5.83, "elapsed_time": "2:21:10", "remaining_time": "1 day, 14:02:29", "throughput": 348.9, "total_tokens": 2955424} {"current_steps": 2335, "total_steps": 40000, "loss": 0.0682, "lr": 0.29748680465794985, "epoch": 0.114088876945252, "percentage": 5.84, "elapsed_time": "2:21:13", "remaining_time": "1 day, 13:58:08", "throughput": 349.53, "total_tokens": 2961888} {"current_steps": 2340, "total_steps": 40000, "loss": 0.1249, "lr": 0.29747605569494884, "epoch": 0.11433317860894633, "percentage": 5.85, "elapsed_time": "2:21:16", "remaining_time": "1 day, 13:53:47", "throughput": 350.15, "total_tokens": 2968192} {"current_steps": 2345, "total_steps": 40000, "loss": 0.0865, "lr": 0.29746528398928673, "epoch": 0.11457748027264066, "percentage": 5.86, "elapsed_time": "2:21:19", "remaining_time": "1 day, 13:49:27", "throughput": 350.74, "total_tokens": 2974304} {"current_steps": 2350, "total_steps": 40000, "loss": 0.116, "lr": 0.2974544895426247, "epoch": 0.11482178193633498, "percentage": 5.88, "elapsed_time": "2:21:23", "remaining_time": "1 day, 13:45:11", "throughput": 351.41, "total_tokens": 2981056} {"current_steps": 2355, "total_steps": 40000, "loss": 0.0953, "lr": 0.29744367235662733, "epoch": 0.11506608360002932, "percentage": 5.89, "elapsed_time": "2:21:26", "remaining_time": "1 day, 13:40:53", "throughput": 352.0, "total_tokens": 2987168} {"current_steps": 2360, "total_steps": 40000, "loss": 0.1115, "lr": 0.29743283243296276, "epoch": 0.11531038526372364, "percentage": 5.9, "elapsed_time": "2:21:29", "remaining_time": "1 day, 13:36:35", "throughput": 352.55, "total_tokens": 2992896} {"current_steps": 2365, "total_steps": 40000, "loss": 0.0994, "lr": 0.29742196977330276, "epoch": 0.11555468692741798, "percentage": 5.91, "elapsed_time": "2:21:32", "remaining_time": "1 day, 13:32:19", "throughput": 353.17, "total_tokens": 2999168} {"current_steps": 2370, "total_steps": 40000, "loss": 0.0663, "lr": 0.2974110843793223, "epoch": 0.1157989885911123, "percentage": 5.92, "elapsed_time": "2:21:35", "remaining_time": "1 day, 13:28:04", "throughput": 353.73, "total_tokens": 3005024} {"current_steps": 2375, "total_steps": 40000, "loss": 0.0619, "lr": 0.2974001762527002, "epoch": 0.11604329025480664, "percentage": 5.94, "elapsed_time": "2:21:38", "remaining_time": "1 day, 13:23:52", "throughput": 354.38, "total_tokens": 3011616} {"current_steps": 2380, "total_steps": 40000, "loss": 0.0781, "lr": 0.2973892453951186, "epoch": 0.11628759191850097, "percentage": 5.95, "elapsed_time": "2:21:41", "remaining_time": "1 day, 13:19:40", "throughput": 355.0, "total_tokens": 3017984} {"current_steps": 2385, "total_steps": 40000, "loss": 0.0654, "lr": 0.2973782918082631, "epoch": 0.11653189358219529, "percentage": 5.96, "elapsed_time": "2:21:44", "remaining_time": "1 day, 13:15:29", "throughput": 355.62, "total_tokens": 3024416} {"current_steps": 2390, "total_steps": 40000, "loss": 0.0766, "lr": 0.29736731549382295, "epoch": 0.11677619524588963, "percentage": 5.97, "elapsed_time": "2:21:47", "remaining_time": "1 day, 13:11:20", "throughput": 356.24, "total_tokens": 3030816} {"current_steps": 2395, "total_steps": 40000, "loss": 0.069, "lr": 0.2973563164534908, "epoch": 0.11702049690958395, "percentage": 5.99, "elapsed_time": "2:21:50", "remaining_time": "1 day, 13:07:11", "throughput": 356.83, "total_tokens": 3036928} {"current_steps": 2400, "total_steps": 40000, "loss": 0.0926, "lr": 0.29734529468896287, "epoch": 0.11726479857327829, "percentage": 6.0, "elapsed_time": "2:21:53", "remaining_time": "1 day, 13:03:03", "throughput": 357.44, "total_tokens": 3043136} {"current_steps": 2400, "total_steps": 40000, "eval_loss": 0.1081715002655983, "epoch": 0.11726479857327829, "percentage": 6.0, "elapsed_time": "2:32:32", "remaining_time": "1 day, 15:49:48", "throughput": 332.49, "total_tokens": 3043136} {"current_steps": 2405, "total_steps": 40000, "loss": 0.077, "lr": 0.2973342502019388, "epoch": 0.11750910023697261, "percentage": 6.01, "elapsed_time": "2:32:36", "remaining_time": "1 day, 15:45:29", "throughput": 333.1, "total_tokens": 3049888} {"current_steps": 2410, "total_steps": 40000, "loss": 0.0476, "lr": 0.2973231829941219, "epoch": 0.11775340190066694, "percentage": 6.02, "elapsed_time": "2:32:39", "remaining_time": "1 day, 15:41:02", "throughput": 333.67, "total_tokens": 3056160} {"current_steps": 2415, "total_steps": 40000, "loss": 0.0896, "lr": 0.2973120930672188, "epoch": 0.11799770356436128, "percentage": 6.04, "elapsed_time": "2:32:42", "remaining_time": "1 day, 15:36:34", "throughput": 334.19, "total_tokens": 3061984} {"current_steps": 2420, "total_steps": 40000, "loss": 0.0722, "lr": 0.2973009804229397, "epoch": 0.1182420052280556, "percentage": 6.05, "elapsed_time": "2:32:45", "remaining_time": "1 day, 15:32:07", "throughput": 334.74, "total_tokens": 3068032} {"current_steps": 2425, "total_steps": 40000, "loss": 0.0958, "lr": 0.29728984506299827, "epoch": 0.11848630689174994, "percentage": 6.06, "elapsed_time": "2:32:48", "remaining_time": "1 day, 15:27:43", "throughput": 335.34, "total_tokens": 3074496} {"current_steps": 2430, "total_steps": 40000, "loss": 0.1378, "lr": 0.2972786869891118, "epoch": 0.11873060855544426, "percentage": 6.08, "elapsed_time": "2:32:51", "remaining_time": "1 day, 15:23:19", "throughput": 335.92, "total_tokens": 3080896} {"current_steps": 2435, "total_steps": 40000, "loss": 0.0762, "lr": 0.29726750620300096, "epoch": 0.11897491021913859, "percentage": 6.09, "elapsed_time": "2:32:54", "remaining_time": "1 day, 15:18:58", "throughput": 336.52, "total_tokens": 3087424} {"current_steps": 2440, "total_steps": 40000, "loss": 0.0686, "lr": 0.29725630270639003, "epoch": 0.11921921188283292, "percentage": 6.1, "elapsed_time": "2:32:57", "remaining_time": "1 day, 15:14:35", "throughput": 337.07, "total_tokens": 3093504} {"current_steps": 2445, "total_steps": 40000, "loss": 0.0804, "lr": 0.2972450765010067, "epoch": 0.11946351354652725, "percentage": 6.11, "elapsed_time": "2:33:00", "remaining_time": "1 day, 15:10:13", "throughput": 337.61, "total_tokens": 3099488} {"current_steps": 2450, "total_steps": 40000, "loss": 0.0982, "lr": 0.29723382758858213, "epoch": 0.11970781521022159, "percentage": 6.12, "elapsed_time": "2:33:03", "remaining_time": "1 day, 15:05:54", "throughput": 338.17, "total_tokens": 3105664} {"current_steps": 2455, "total_steps": 40000, "loss": 0.0879, "lr": 0.29722255597085107, "epoch": 0.11995211687391591, "percentage": 6.14, "elapsed_time": "2:33:06", "remaining_time": "1 day, 15:01:36", "throughput": 338.77, "total_tokens": 3112192} {"current_steps": 2460, "total_steps": 40000, "loss": 0.0807, "lr": 0.2972112616495518, "epoch": 0.12019641853761025, "percentage": 6.15, "elapsed_time": "2:33:09", "remaining_time": "1 day, 14:57:19", "throughput": 339.35, "total_tokens": 3118592} {"current_steps": 2465, "total_steps": 40000, "loss": 0.0818, "lr": 0.297199944626426, "epoch": 0.12044072020130457, "percentage": 6.16, "elapsed_time": "2:33:12", "remaining_time": "1 day, 14:53:01", "throughput": 339.88, "total_tokens": 3124480} {"current_steps": 2470, "total_steps": 40000, "loss": 0.0964, "lr": 0.2971886049032189, "epoch": 0.1206850218649989, "percentage": 6.17, "elapsed_time": "2:33:15", "remaining_time": "1 day, 14:48:45", "throughput": 340.46, "total_tokens": 3130848} {"current_steps": 2475, "total_steps": 40000, "loss": 0.0919, "lr": 0.29717724248167926, "epoch": 0.12092932352869323, "percentage": 6.19, "elapsed_time": "2:33:19", "remaining_time": "1 day, 14:44:32", "throughput": 341.03, "total_tokens": 3137120} {"current_steps": 2480, "total_steps": 40000, "loss": 0.0745, "lr": 0.29716585736355927, "epoch": 0.12117362519238756, "percentage": 6.2, "elapsed_time": "2:33:22", "remaining_time": "1 day, 14:40:19", "throughput": 341.6, "total_tokens": 3143456} {"current_steps": 2485, "total_steps": 40000, "loss": 0.0838, "lr": 0.2971544495506147, "epoch": 0.1214179268560819, "percentage": 6.21, "elapsed_time": "2:33:25", "remaining_time": "1 day, 14:36:07", "throughput": 342.16, "total_tokens": 3149664} {"current_steps": 2490, "total_steps": 40000, "loss": 0.0804, "lr": 0.2971430190446048, "epoch": 0.12166222851977622, "percentage": 6.22, "elapsed_time": "2:33:28", "remaining_time": "1 day, 14:31:56", "throughput": 342.74, "total_tokens": 3156032} {"current_steps": 2495, "total_steps": 40000, "loss": 0.089, "lr": 0.2971315658472921, "epoch": 0.12190653018347054, "percentage": 6.24, "elapsed_time": "2:33:31", "remaining_time": "1 day, 14:27:47", "throughput": 343.33, "total_tokens": 3162560} {"current_steps": 2500, "total_steps": 40000, "loss": 0.0758, "lr": 0.2971200899604431, "epoch": 0.12215083184716488, "percentage": 6.25, "elapsed_time": "2:33:34", "remaining_time": "1 day, 14:23:38", "throughput": 343.9, "total_tokens": 3168864} {"current_steps": 2505, "total_steps": 40000, "loss": 0.0797, "lr": 0.29710859138582735, "epoch": 0.1223951335108592, "percentage": 6.26, "elapsed_time": "2:33:37", "remaining_time": "1 day, 14:19:31", "throughput": 344.49, "total_tokens": 3175424} {"current_steps": 2510, "total_steps": 40000, "loss": 0.0743, "lr": 0.29709707012521813, "epoch": 0.12263943517455354, "percentage": 6.28, "elapsed_time": "2:33:40", "remaining_time": "1 day, 14:15:24", "throughput": 345.06, "total_tokens": 3181696} {"current_steps": 2515, "total_steps": 40000, "loss": 0.0792, "lr": 0.29708552618039213, "epoch": 0.12288373683824787, "percentage": 6.29, "elapsed_time": "2:33:43", "remaining_time": "1 day, 14:11:19", "throughput": 345.67, "total_tokens": 3188416} {"current_steps": 2520, "total_steps": 40000, "loss": 0.0971, "lr": 0.2970739595531296, "epoch": 0.12312803850194219, "percentage": 6.3, "elapsed_time": "2:33:47", "remaining_time": "1 day, 14:07:13", "throughput": 346.23, "total_tokens": 3194624} {"current_steps": 2525, "total_steps": 40000, "loss": 0.0909, "lr": 0.2970623702452143, "epoch": 0.12337234016563653, "percentage": 6.31, "elapsed_time": "2:33:50", "remaining_time": "1 day, 14:03:08", "throughput": 346.78, "total_tokens": 3200832} {"current_steps": 2530, "total_steps": 40000, "loss": 0.0743, "lr": 0.2970507582584334, "epoch": 0.12361664182933085, "percentage": 6.33, "elapsed_time": "2:33:53", "remaining_time": "1 day, 13:59:07", "throughput": 347.44, "total_tokens": 3208000} {"current_steps": 2535, "total_steps": 40000, "loss": 0.0932, "lr": 0.2970391235945776, "epoch": 0.12386094349302519, "percentage": 6.34, "elapsed_time": "2:33:56", "remaining_time": "1 day, 13:55:06", "throughput": 348.04, "total_tokens": 3214656} {"current_steps": 2540, "total_steps": 40000, "loss": 0.1249, "lr": 0.2970274662554412, "epoch": 0.12410524515671952, "percentage": 6.35, "elapsed_time": "2:33:59", "remaining_time": "1 day, 13:51:04", "throughput": 348.6, "total_tokens": 3220864} {"current_steps": 2545, "total_steps": 40000, "loss": 0.1091, "lr": 0.2970157862428218, "epoch": 0.12434954682041385, "percentage": 6.36, "elapsed_time": "2:34:02", "remaining_time": "1 day, 13:47:04", "throughput": 349.19, "total_tokens": 3227424} {"current_steps": 2550, "total_steps": 40000, "loss": 0.0852, "lr": 0.2970040835585206, "epoch": 0.12459384848410818, "percentage": 6.38, "elapsed_time": "2:34:05", "remaining_time": "1 day, 13:43:05", "throughput": 349.77, "total_tokens": 3233888} {"current_steps": 2555, "total_steps": 40000, "loss": 0.0737, "lr": 0.2969923582043424, "epoch": 0.1248381501478025, "percentage": 6.39, "elapsed_time": "2:34:08", "remaining_time": "1 day, 13:39:07", "throughput": 350.36, "total_tokens": 3240448} {"current_steps": 2560, "total_steps": 40000, "loss": 0.1194, "lr": 0.2969806101820953, "epoch": 0.12508245181149683, "percentage": 6.4, "elapsed_time": "2:34:12", "remaining_time": "1 day, 13:35:10", "throughput": 350.94, "total_tokens": 3246880} {"current_steps": 2565, "total_steps": 40000, "loss": 0.0665, "lr": 0.2969688394935911, "epoch": 0.12532675347519118, "percentage": 6.41, "elapsed_time": "2:34:15", "remaining_time": "1 day, 13:31:14", "throughput": 351.5, "total_tokens": 3253184} {"current_steps": 2570, "total_steps": 40000, "loss": 0.0557, "lr": 0.2969570461406449, "epoch": 0.1255710551388855, "percentage": 6.42, "elapsed_time": "2:34:18", "remaining_time": "1 day, 13:27:18", "throughput": 352.06, "total_tokens": 3259456} {"current_steps": 2575, "total_steps": 40000, "loss": 0.0923, "lr": 0.29694523012507534, "epoch": 0.12581535680257983, "percentage": 6.44, "elapsed_time": "2:34:21", "remaining_time": "1 day, 13:23:23", "throughput": 352.66, "total_tokens": 3266112} {"current_steps": 2580, "total_steps": 40000, "loss": 0.106, "lr": 0.2969333914487048, "epoch": 0.12605965846627415, "percentage": 6.45, "elapsed_time": "2:34:24", "remaining_time": "1 day, 13:19:29", "throughput": 353.23, "total_tokens": 3272448} {"current_steps": 2585, "total_steps": 40000, "loss": 0.0718, "lr": 0.2969215301133587, "epoch": 0.12630396012996847, "percentage": 6.46, "elapsed_time": "2:34:27", "remaining_time": "1 day, 13:15:36", "throughput": 353.78, "total_tokens": 3278624} {"current_steps": 2590, "total_steps": 40000, "loss": 0.0718, "lr": 0.29690964612086634, "epoch": 0.12654826179366283, "percentage": 6.48, "elapsed_time": "2:34:30", "remaining_time": "1 day, 13:11:46", "throughput": 354.41, "total_tokens": 3285632} {"current_steps": 2595, "total_steps": 40000, "loss": 0.0952, "lr": 0.2968977394730604, "epoch": 0.12679256345735715, "percentage": 6.49, "elapsed_time": "2:34:33", "remaining_time": "1 day, 13:07:56", "throughput": 355.0, "total_tokens": 3292256} {"current_steps": 2600, "total_steps": 40000, "loss": 0.065, "lr": 0.296885810171777, "epoch": 0.12703686512105147, "percentage": 6.5, "elapsed_time": "2:34:36", "remaining_time": "1 day, 13:04:04", "throughput": 355.56, "total_tokens": 3298464} {"current_steps": 2600, "total_steps": 40000, "eval_loss": 0.08662457019090652, "epoch": 0.12703686512105147, "percentage": 6.5, "elapsed_time": "2:45:16", "remaining_time": "1 day, 15:37:18", "throughput": 332.64, "total_tokens": 3298464} {"current_steps": 2605, "total_steps": 40000, "loss": 0.0977, "lr": 0.2968738582188558, "epoch": 0.1272811667847458, "percentage": 6.51, "elapsed_time": "2:45:19", "remaining_time": "1 day, 15:33:18", "throughput": 333.13, "total_tokens": 3304544} {"current_steps": 2610, "total_steps": 40000, "loss": 0.0982, "lr": 0.2968618836161399, "epoch": 0.12752546844844012, "percentage": 6.53, "elapsed_time": "2:45:22", "remaining_time": "1 day, 15:29:12", "throughput": 333.71, "total_tokens": 3311392} {"current_steps": 2615, "total_steps": 40000, "loss": 0.0797, "lr": 0.296849886365476, "epoch": 0.12776977011213447, "percentage": 6.54, "elapsed_time": "2:45:26", "remaining_time": "1 day, 15:25:07", "throughput": 334.29, "total_tokens": 3318208} {"current_steps": 2620, "total_steps": 40000, "loss": 0.094, "lr": 0.2968378664687142, "epoch": 0.1280140717758288, "percentage": 6.55, "elapsed_time": "2:45:29", "remaining_time": "1 day, 15:21:03", "throughput": 334.87, "total_tokens": 3324992} {"current_steps": 2625, "total_steps": 40000, "loss": 0.0788, "lr": 0.296825823927708, "epoch": 0.12825837343952312, "percentage": 6.56, "elapsed_time": "2:45:32", "remaining_time": "1 day, 15:16:58", "throughput": 335.4, "total_tokens": 3331328} {"current_steps": 2630, "total_steps": 40000, "loss": 0.0856, "lr": 0.29681375874431476, "epoch": 0.12850267510321745, "percentage": 6.58, "elapsed_time": "2:45:35", "remaining_time": "1 day, 15:12:56", "throughput": 336.0, "total_tokens": 3338400} {"current_steps": 2635, "total_steps": 40000, "loss": 0.095, "lr": 0.29680167092039483, "epoch": 0.12874697676691177, "percentage": 6.59, "elapsed_time": "2:45:38", "remaining_time": "1 day, 15:08:52", "throughput": 336.51, "total_tokens": 3344480} {"current_steps": 2640, "total_steps": 40000, "loss": 0.119, "lr": 0.2967895604578125, "epoch": 0.12899127843060612, "percentage": 6.6, "elapsed_time": "2:45:41", "remaining_time": "1 day, 15:04:52", "throughput": 337.1, "total_tokens": 3351360} {"current_steps": 2645, "total_steps": 40000, "loss": 0.1132, "lr": 0.2967774273584352, "epoch": 0.12923558009430045, "percentage": 6.61, "elapsed_time": "2:45:45", "remaining_time": "1 day, 15:00:52", "throughput": 337.66, "total_tokens": 3358016} {"current_steps": 2650, "total_steps": 40000, "loss": 0.0753, "lr": 0.2967652716241342, "epoch": 0.12947988175799477, "percentage": 6.62, "elapsed_time": "2:45:48", "remaining_time": "1 day, 14:56:52", "throughput": 338.2, "total_tokens": 3364480} {"current_steps": 2655, "total_steps": 40000, "loss": 0.0866, "lr": 0.29675309325678384, "epoch": 0.1297241834216891, "percentage": 6.64, "elapsed_time": "2:45:51", "remaining_time": "1 day, 14:52:53", "throughput": 338.76, "total_tokens": 3371136} {"current_steps": 2660, "total_steps": 40000, "loss": 0.0726, "lr": 0.29674089225826233, "epoch": 0.12996848508538345, "percentage": 6.65, "elapsed_time": "2:45:54", "remaining_time": "1 day, 14:48:53", "throughput": 339.25, "total_tokens": 3377024} {"current_steps": 2665, "total_steps": 40000, "loss": 0.0908, "lr": 0.29672866863045116, "epoch": 0.13021278674907777, "percentage": 6.66, "elapsed_time": "2:45:57", "remaining_time": "1 day, 14:44:56", "throughput": 339.79, "total_tokens": 3383456} {"current_steps": 2670, "total_steps": 40000, "loss": 0.0784, "lr": 0.2967164223752354, "epoch": 0.1304570884127721, "percentage": 6.68, "elapsed_time": "2:46:00", "remaining_time": "1 day, 14:41:00", "throughput": 340.32, "total_tokens": 3389728} {"current_steps": 2675, "total_steps": 40000, "loss": 0.1028, "lr": 0.2967041534945035, "epoch": 0.13070139007646642, "percentage": 6.69, "elapsed_time": "2:46:03", "remaining_time": "1 day, 14:37:04", "throughput": 340.86, "total_tokens": 3396192} {"current_steps": 2680, "total_steps": 40000, "loss": 0.0824, "lr": 0.2966918619901476, "epoch": 0.13094569174016074, "percentage": 6.7, "elapsed_time": "2:46:06", "remaining_time": "1 day, 14:33:10", "throughput": 341.4, "total_tokens": 3402656} {"current_steps": 2685, "total_steps": 40000, "loss": 0.096, "lr": 0.2966795478640631, "epoch": 0.1311899934038551, "percentage": 6.71, "elapsed_time": "2:46:09", "remaining_time": "1 day, 14:29:16", "throughput": 341.95, "total_tokens": 3409152} {"current_steps": 2690, "total_steps": 40000, "loss": 0.0759, "lr": 0.29666721111814903, "epoch": 0.13143429506754942, "percentage": 6.73, "elapsed_time": "2:46:12", "remaining_time": "1 day, 14:25:23", "throughput": 342.49, "total_tokens": 3415616} {"current_steps": 2695, "total_steps": 40000, "loss": 0.0775, "lr": 0.2966548517543079, "epoch": 0.13167859673124374, "percentage": 6.74, "elapsed_time": "2:46:16", "remaining_time": "1 day, 14:21:31", "throughput": 343.04, "total_tokens": 3422208} {"current_steps": 2700, "total_steps": 40000, "loss": 0.0944, "lr": 0.29664246977444564, "epoch": 0.13192289839493807, "percentage": 6.75, "elapsed_time": "2:46:19", "remaining_time": "1 day, 14:17:41", "throughput": 343.63, "total_tokens": 3429120} {"current_steps": 2705, "total_steps": 40000, "loss": 0.0858, "lr": 0.2966300651804717, "epoch": 0.1321672000586324, "percentage": 6.76, "elapsed_time": "2:46:22", "remaining_time": "1 day, 14:13:49", "throughput": 344.14, "total_tokens": 3435264} {"current_steps": 2710, "total_steps": 40000, "loss": 0.0791, "lr": 0.296617637974299, "epoch": 0.13241150172232674, "percentage": 6.78, "elapsed_time": "2:46:25", "remaining_time": "1 day, 14:10:00", "throughput": 344.69, "total_tokens": 3441888} {"current_steps": 2715, "total_steps": 40000, "loss": 0.0639, "lr": 0.2966051881578441, "epoch": 0.13265580338602107, "percentage": 6.79, "elapsed_time": "2:46:28", "remaining_time": "1 day, 14:06:10", "throughput": 345.17, "total_tokens": 3447744} {"current_steps": 2720, "total_steps": 40000, "loss": 0.0687, "lr": 0.29659271573302676, "epoch": 0.1329001050497154, "percentage": 6.8, "elapsed_time": "2:46:31", "remaining_time": "1 day, 14:02:21", "throughput": 345.69, "total_tokens": 3453920} {"current_steps": 2725, "total_steps": 40000, "loss": 0.1034, "lr": 0.2965802207017705, "epoch": 0.1331444067134097, "percentage": 6.81, "elapsed_time": "2:46:34", "remaining_time": "1 day, 13:58:33", "throughput": 346.17, "total_tokens": 3459776} {"current_steps": 2730, "total_steps": 40000, "loss": 0.0809, "lr": 0.2965677030660021, "epoch": 0.13338870837710404, "percentage": 6.83, "elapsed_time": "2:46:37", "remaining_time": "1 day, 13:54:47", "throughput": 346.69, "total_tokens": 3466048} {"current_steps": 2735, "total_steps": 40000, "loss": 0.0799, "lr": 0.2965551628276521, "epoch": 0.1336330100407984, "percentage": 6.84, "elapsed_time": "2:46:40", "remaining_time": "1 day, 13:51:01", "throughput": 347.23, "total_tokens": 3472544} {"current_steps": 2740, "total_steps": 40000, "loss": 0.0889, "lr": 0.29654259998865423, "epoch": 0.1338773117044927, "percentage": 6.85, "elapsed_time": "2:46:43", "remaining_time": "1 day, 13:47:15", "throughput": 347.72, "total_tokens": 3478528} {"current_steps": 2745, "total_steps": 40000, "loss": 0.0848, "lr": 0.2965300145509458, "epoch": 0.13412161336818704, "percentage": 6.86, "elapsed_time": "2:46:46", "remaining_time": "1 day, 13:43:32", "throughput": 348.29, "total_tokens": 3485312} {"current_steps": 2750, "total_steps": 40000, "loss": 0.1001, "lr": 0.2965174065164678, "epoch": 0.13436591503188136, "percentage": 6.88, "elapsed_time": "2:46:50", "remaining_time": "1 day, 13:39:50", "throughput": 348.85, "total_tokens": 3492000} {"current_steps": 2755, "total_steps": 40000, "loss": 0.0989, "lr": 0.2965047758871644, "epoch": 0.13461021669557569, "percentage": 6.89, "elapsed_time": "2:46:53", "remaining_time": "1 day, 13:36:06", "throughput": 349.37, "total_tokens": 3498272} {"current_steps": 2760, "total_steps": 40000, "loss": 0.0987, "lr": 0.2964921226649835, "epoch": 0.13485451835927004, "percentage": 6.9, "elapsed_time": "2:46:56", "remaining_time": "1 day, 13:32:24", "throughput": 349.88, "total_tokens": 3504448} {"current_steps": 2765, "total_steps": 40000, "loss": 0.053, "lr": 0.2964794468518763, "epoch": 0.13509882002296436, "percentage": 6.91, "elapsed_time": "2:46:59", "remaining_time": "1 day, 13:28:44", "throughput": 350.43, "total_tokens": 3511072} {"current_steps": 2770, "total_steps": 40000, "loss": 0.0771, "lr": 0.2964667484497977, "epoch": 0.13534312168665869, "percentage": 6.93, "elapsed_time": "2:47:02", "remaining_time": "1 day, 13:25:05", "throughput": 351.02, "total_tokens": 3518048} {"current_steps": 2775, "total_steps": 40000, "loss": 0.1009, "lr": 0.29645402746070587, "epoch": 0.135587423350353, "percentage": 6.94, "elapsed_time": "2:47:05", "remaining_time": "1 day, 13:21:25", "throughput": 351.53, "total_tokens": 3524224} {"current_steps": 2780, "total_steps": 40000, "loss": 0.0699, "lr": 0.2964412838865625, "epoch": 0.13583172501404733, "percentage": 6.95, "elapsed_time": "2:47:08", "remaining_time": "1 day, 13:17:46", "throughput": 352.03, "total_tokens": 3530304} {"current_steps": 2785, "total_steps": 40000, "loss": 0.1188, "lr": 0.29642851772933293, "epoch": 0.13607602667774168, "percentage": 6.96, "elapsed_time": "2:47:11", "remaining_time": "1 day, 13:14:09", "throughput": 352.54, "total_tokens": 3536544} {"current_steps": 2790, "total_steps": 40000, "loss": 0.0764, "lr": 0.29641572899098567, "epoch": 0.136320328341436, "percentage": 6.98, "elapsed_time": "2:47:14", "remaining_time": "1 day, 13:10:33", "throughput": 353.09, "total_tokens": 3543168} {"current_steps": 2795, "total_steps": 40000, "loss": 0.0697, "lr": 0.29640291767349314, "epoch": 0.13656463000513033, "percentage": 6.99, "elapsed_time": "2:47:18", "remaining_time": "1 day, 13:06:58", "throughput": 353.67, "total_tokens": 3550144} {"current_steps": 2800, "total_steps": 40000, "loss": 0.0682, "lr": 0.2963900837788308, "epoch": 0.13680893166882466, "percentage": 7.0, "elapsed_time": "2:47:21", "remaining_time": "1 day, 13:03:22", "throughput": 354.17, "total_tokens": 3556256} {"current_steps": 2800, "total_steps": 40000, "eval_loss": 0.08693277835845947, "epoch": 0.13680893166882466, "percentage": 7.0, "elapsed_time": "2:57:59", "remaining_time": "1 day, 15:24:46", "throughput": 332.99, "total_tokens": 3556256} {"current_steps": 2805, "total_steps": 40000, "loss": 0.0831, "lr": 0.2963772273089779, "epoch": 0.13705323333251898, "percentage": 7.01, "elapsed_time": "2:58:03", "remaining_time": "1 day, 15:21:04", "throughput": 333.46, "total_tokens": 3562464} {"current_steps": 2810, "total_steps": 40000, "loss": 0.0807, "lr": 0.2963643482659171, "epoch": 0.13729753499621333, "percentage": 7.03, "elapsed_time": "2:58:06", "remaining_time": "1 day, 15:17:14", "throughput": 333.96, "total_tokens": 3568864} {"current_steps": 2815, "total_steps": 40000, "loss": 0.0665, "lr": 0.2963514466516345, "epoch": 0.13754183665990766, "percentage": 7.04, "elapsed_time": "2:58:09", "remaining_time": "1 day, 15:13:24", "throughput": 334.45, "total_tokens": 3575072} {"current_steps": 2820, "total_steps": 40000, "loss": 0.0994, "lr": 0.2963385224681196, "epoch": 0.13778613832360198, "percentage": 7.05, "elapsed_time": "2:58:12", "remaining_time": "1 day, 15:09:35", "throughput": 334.94, "total_tokens": 3581408} {"current_steps": 2825, "total_steps": 40000, "loss": 0.0503, "lr": 0.29632557571736556, "epoch": 0.1380304399872963, "percentage": 7.06, "elapsed_time": "2:58:15", "remaining_time": "1 day, 15:05:48", "throughput": 335.47, "total_tokens": 3588096} {"current_steps": 2830, "total_steps": 40000, "loss": 0.1201, "lr": 0.2963126064013689, "epoch": 0.13827474165099066, "percentage": 7.07, "elapsed_time": "2:58:18", "remaining_time": "1 day, 15:02:00", "throughput": 335.95, "total_tokens": 3594240} {"current_steps": 2835, "total_steps": 40000, "loss": 0.0802, "lr": 0.29629961452212966, "epoch": 0.13851904331468498, "percentage": 7.09, "elapsed_time": "2:58:21", "remaining_time": "1 day, 14:58:14", "throughput": 336.46, "total_tokens": 3600704} {"current_steps": 2840, "total_steps": 40000, "loss": 0.0918, "lr": 0.2962866000816513, "epoch": 0.1387633449783793, "percentage": 7.1, "elapsed_time": "2:58:24", "remaining_time": "1 day, 14:54:28", "throughput": 336.93, "total_tokens": 3606816} {"current_steps": 2845, "total_steps": 40000, "loss": 0.0638, "lr": 0.2962735630819409, "epoch": 0.13900764664207363, "percentage": 7.11, "elapsed_time": "2:58:28", "remaining_time": "1 day, 14:50:45", "throughput": 337.46, "total_tokens": 3613504} {"current_steps": 2850, "total_steps": 40000, "loss": 0.0548, "lr": 0.2962605035250089, "epoch": 0.13925194830576795, "percentage": 7.12, "elapsed_time": "2:58:31", "remaining_time": "1 day, 14:47:00", "throughput": 337.93, "total_tokens": 3619616} {"current_steps": 2855, "total_steps": 40000, "loss": 0.0505, "lr": 0.29624742141286914, "epoch": 0.1394962499694623, "percentage": 7.14, "elapsed_time": "2:58:34", "remaining_time": "1 day, 14:43:18", "throughput": 338.46, "total_tokens": 3626368} {"current_steps": 2860, "total_steps": 40000, "loss": 0.0418, "lr": 0.29623431674753925, "epoch": 0.13974055163315663, "percentage": 7.15, "elapsed_time": "2:58:37", "remaining_time": "1 day, 14:39:36", "throughput": 338.97, "total_tokens": 3632928} {"current_steps": 2865, "total_steps": 40000, "loss": 0.0972, "lr": 0.29622118953103993, "epoch": 0.13998485329685095, "percentage": 7.16, "elapsed_time": "2:58:40", "remaining_time": "1 day, 14:35:53", "throughput": 339.45, "total_tokens": 3639008} {"current_steps": 2870, "total_steps": 40000, "loss": 0.1157, "lr": 0.2962080397653957, "epoch": 0.14022915496054528, "percentage": 7.17, "elapsed_time": "2:58:43", "remaining_time": "1 day, 14:32:12", "throughput": 339.93, "total_tokens": 3645184} {"current_steps": 2875, "total_steps": 40000, "loss": 0.1054, "lr": 0.29619486745263435, "epoch": 0.1404734566242396, "percentage": 7.19, "elapsed_time": "2:58:46", "remaining_time": "1 day, 14:28:32", "throughput": 340.4, "total_tokens": 3651264} {"current_steps": 2880, "total_steps": 40000, "loss": 0.0781, "lr": 0.2961816725947873, "epoch": 0.14071775828793395, "percentage": 7.2, "elapsed_time": "2:58:49", "remaining_time": "1 day, 14:24:52", "throughput": 340.89, "total_tokens": 3657664} {"current_steps": 2885, "total_steps": 40000, "loss": 0.0807, "lr": 0.29616845519388924, "epoch": 0.14096205995162828, "percentage": 7.21, "elapsed_time": "2:58:52", "remaining_time": "1 day, 14:21:14", "throughput": 341.38, "total_tokens": 3663968} {"current_steps": 2890, "total_steps": 40000, "loss": 0.0688, "lr": 0.2961552152519785, "epoch": 0.1412063616153226, "percentage": 7.22, "elapsed_time": "2:58:55", "remaining_time": "1 day, 14:17:37", "throughput": 341.89, "total_tokens": 3670464} {"current_steps": 2895, "total_steps": 40000, "loss": 0.0684, "lr": 0.29614195277109695, "epoch": 0.14145066327901692, "percentage": 7.24, "elapsed_time": "2:58:58", "remaining_time": "1 day, 14:13:58", "throughput": 342.33, "total_tokens": 3676256} {"current_steps": 2900, "total_steps": 40000, "loss": 0.0529, "lr": 0.2961286677532897, "epoch": 0.14169496494271125, "percentage": 7.25, "elapsed_time": "2:59:01", "remaining_time": "1 day, 14:10:22", "throughput": 342.84, "total_tokens": 3682720} {"current_steps": 2905, "total_steps": 40000, "loss": 0.1004, "lr": 0.2961153602006055, "epoch": 0.1419392666064056, "percentage": 7.26, "elapsed_time": "2:59:04", "remaining_time": "1 day, 14:06:46", "throughput": 343.31, "total_tokens": 3688896} {"current_steps": 2910, "total_steps": 40000, "loss": 0.1031, "lr": 0.29610203011509656, "epoch": 0.14218356827009992, "percentage": 7.27, "elapsed_time": "2:59:08", "remaining_time": "1 day, 14:03:11", "throughput": 343.79, "total_tokens": 3695040} {"current_steps": 2915, "total_steps": 40000, "loss": 0.1165, "lr": 0.29608867749881856, "epoch": 0.14242786993379425, "percentage": 7.29, "elapsed_time": "2:59:10", "remaining_time": "1 day, 13:59:34", "throughput": 344.22, "total_tokens": 3700672} {"current_steps": 2920, "total_steps": 40000, "loss": 0.0758, "lr": 0.29607530235383067, "epoch": 0.14267217159748857, "percentage": 7.3, "elapsed_time": "2:59:14", "remaining_time": "1 day, 13:56:01", "throughput": 344.69, "total_tokens": 3706816} {"current_steps": 2925, "total_steps": 40000, "loss": 0.0799, "lr": 0.2960619046821954, "epoch": 0.1429164732611829, "percentage": 7.31, "elapsed_time": "2:59:17", "remaining_time": "1 day, 13:52:28", "throughput": 345.17, "total_tokens": 3712992} {"current_steps": 2930, "total_steps": 40000, "loss": 0.0666, "lr": 0.2960484844859789, "epoch": 0.14316077492487725, "percentage": 7.32, "elapsed_time": "2:59:20", "remaining_time": "1 day, 13:48:55", "throughput": 345.62, "total_tokens": 3718944} {"current_steps": 2935, "total_steps": 40000, "loss": 0.0801, "lr": 0.29603504176725076, "epoch": 0.14340507658857157, "percentage": 7.34, "elapsed_time": "2:59:23", "remaining_time": "1 day, 13:45:25", "throughput": 346.15, "total_tokens": 3725696} {"current_steps": 2940, "total_steps": 40000, "loss": 0.0871, "lr": 0.296021576528084, "epoch": 0.1436493782522659, "percentage": 7.35, "elapsed_time": "2:59:26", "remaining_time": "1 day, 13:41:55", "throughput": 346.65, "total_tokens": 3732192} {"current_steps": 2945, "total_steps": 40000, "loss": 0.0765, "lr": 0.29600808877055507, "epoch": 0.14389367991596022, "percentage": 7.36, "elapsed_time": "2:59:29", "remaining_time": "1 day, 13:38:25", "throughput": 347.14, "total_tokens": 3738560} {"current_steps": 2950, "total_steps": 40000, "loss": 0.0742, "lr": 0.29599457849674404, "epoch": 0.14413798157965454, "percentage": 7.38, "elapsed_time": "2:59:32", "remaining_time": "1 day, 13:34:55", "throughput": 347.62, "total_tokens": 3744768} {"current_steps": 2955, "total_steps": 40000, "loss": 0.0602, "lr": 0.2959810457087343, "epoch": 0.1443822832433489, "percentage": 7.39, "elapsed_time": "2:59:35", "remaining_time": "1 day, 13:31:27", "throughput": 348.14, "total_tokens": 3751392} {"current_steps": 2960, "total_steps": 40000, "loss": 0.0677, "lr": 0.2959674904086128, "epoch": 0.14462658490704322, "percentage": 7.4, "elapsed_time": "2:59:38", "remaining_time": "1 day, 13:28:00", "throughput": 348.65, "total_tokens": 3758080} {"current_steps": 2965, "total_steps": 40000, "loss": 0.0474, "lr": 0.2959539125984699, "epoch": 0.14487088657073754, "percentage": 7.41, "elapsed_time": "2:59:41", "remaining_time": "1 day, 13:24:33", "throughput": 349.14, "total_tokens": 3764384} {"current_steps": 2970, "total_steps": 40000, "loss": 0.0858, "lr": 0.2959403122803996, "epoch": 0.14511518823443187, "percentage": 7.42, "elapsed_time": "2:59:44", "remaining_time": "1 day, 13:21:07", "throughput": 349.62, "total_tokens": 3770624} {"current_steps": 2975, "total_steps": 40000, "loss": 0.0839, "lr": 0.2959266894564991, "epoch": 0.1453594898981262, "percentage": 7.44, "elapsed_time": "2:59:48", "remaining_time": "1 day, 13:17:41", "throughput": 350.13, "total_tokens": 3777184} {"current_steps": 2980, "total_steps": 40000, "loss": 0.0622, "lr": 0.2959130441288692, "epoch": 0.14560379156182054, "percentage": 7.45, "elapsed_time": "2:59:51", "remaining_time": "1 day, 13:14:17", "throughput": 350.63, "total_tokens": 3783776} {"current_steps": 2985, "total_steps": 40000, "loss": 0.0518, "lr": 0.2958993762996143, "epoch": 0.14584809322551487, "percentage": 7.46, "elapsed_time": "2:59:54", "remaining_time": "1 day, 13:10:53", "throughput": 351.16, "total_tokens": 3790528} {"current_steps": 2990, "total_steps": 40000, "loss": 0.1263, "lr": 0.2958856859708421, "epoch": 0.1460923948892092, "percentage": 7.47, "elapsed_time": "2:59:57", "remaining_time": "1 day, 13:07:31", "throughput": 351.67, "total_tokens": 3797120} {"current_steps": 2995, "total_steps": 40000, "loss": 0.1134, "lr": 0.2958719731446638, "epoch": 0.14633669655290352, "percentage": 7.49, "elapsed_time": "3:00:00", "remaining_time": "1 day, 13:04:07", "throughput": 352.14, "total_tokens": 3803328} {"current_steps": 3000, "total_steps": 40000, "loss": 0.1001, "lr": 0.29585823782319404, "epoch": 0.14658099821659787, "percentage": 7.5, "elapsed_time": "3:00:03", "remaining_time": "1 day, 13:00:44", "throughput": 352.62, "total_tokens": 3809536} {"current_steps": 3000, "total_steps": 40000, "eval_loss": 0.09068971127271652, "epoch": 0.14658099821659787, "percentage": 7.5, "elapsed_time": "3:10:42", "remaining_time": "1 day, 15:12:02", "throughput": 332.93, "total_tokens": 3809536} {"current_steps": 3005, "total_steps": 40000, "loss": 0.0981, "lr": 0.2958444800085511, "epoch": 0.1468252998802922, "percentage": 7.51, "elapsed_time": "3:10:46", "remaining_time": "1 day, 15:08:34", "throughput": 333.35, "total_tokens": 3815552} {"current_steps": 3010, "total_steps": 40000, "loss": 0.0918, "lr": 0.2958306997028565, "epoch": 0.14706960154398652, "percentage": 7.52, "elapsed_time": "3:10:49", "remaining_time": "1 day, 15:04:59", "throughput": 333.83, "total_tokens": 3822144} {"current_steps": 3015, "total_steps": 40000, "loss": 0.0753, "lr": 0.2958168969082354, "epoch": 0.14731390320768084, "percentage": 7.54, "elapsed_time": "3:10:52", "remaining_time": "1 day, 15:01:24", "throughput": 334.26, "total_tokens": 3828032} {"current_steps": 3020, "total_steps": 40000, "loss": 0.0618, "lr": 0.2958030716268164, "epoch": 0.14755820487137516, "percentage": 7.55, "elapsed_time": "3:10:55", "remaining_time": "1 day, 14:57:49", "throughput": 334.7, "total_tokens": 3834016} {"current_steps": 3025, "total_steps": 40000, "loss": 0.0462, "lr": 0.2957892238607314, "epoch": 0.14780250653506952, "percentage": 7.56, "elapsed_time": "3:10:58", "remaining_time": "1 day, 14:54:17", "throughput": 335.2, "total_tokens": 3840896} {"current_steps": 3030, "total_steps": 40000, "loss": 0.0469, "lr": 0.2957753536121161, "epoch": 0.14804680819876384, "percentage": 7.58, "elapsed_time": "3:11:01", "remaining_time": "1 day, 14:50:45", "throughput": 335.68, "total_tokens": 3847360} {"current_steps": 3035, "total_steps": 40000, "loss": 0.0821, "lr": 0.29576146088310923, "epoch": 0.14829110986245816, "percentage": 7.59, "elapsed_time": "3:11:04", "remaining_time": "1 day, 14:47:14", "throughput": 336.17, "total_tokens": 3854080} {"current_steps": 3040, "total_steps": 40000, "loss": 0.0785, "lr": 0.2957475456758533, "epoch": 0.1485354115261525, "percentage": 7.6, "elapsed_time": "3:11:07", "remaining_time": "1 day, 14:43:44", "throughput": 336.66, "total_tokens": 3860736} {"current_steps": 3045, "total_steps": 40000, "loss": 0.0878, "lr": 0.2957336079924944, "epoch": 0.1487797131898468, "percentage": 7.61, "elapsed_time": "3:11:10", "remaining_time": "1 day, 14:40:14", "throughput": 337.13, "total_tokens": 3867168} {"current_steps": 3050, "total_steps": 40000, "loss": 0.0853, "lr": 0.2957196478351816, "epoch": 0.14902401485354116, "percentage": 7.62, "elapsed_time": "3:11:13", "remaining_time": "1 day, 14:36:44", "throughput": 337.57, "total_tokens": 3873216} {"current_steps": 3055, "total_steps": 40000, "loss": 0.0822, "lr": 0.295705665206068, "epoch": 0.1492683165172355, "percentage": 7.64, "elapsed_time": "3:11:16", "remaining_time": "1 day, 14:33:14", "throughput": 337.99, "total_tokens": 3879072} {"current_steps": 3060, "total_steps": 40000, "loss": 0.0621, "lr": 0.2956916601073097, "epoch": 0.1495126181809298, "percentage": 7.65, "elapsed_time": "3:11:20", "remaining_time": "1 day, 14:29:47", "throughput": 338.49, "total_tokens": 3885920} {"current_steps": 3065, "total_steps": 40000, "loss": 0.0894, "lr": 0.29567763254106655, "epoch": 0.14975691984462414, "percentage": 7.66, "elapsed_time": "3:11:23", "remaining_time": "1 day, 14:26:19", "throughput": 338.95, "total_tokens": 3892224} {"current_steps": 3070, "total_steps": 40000, "loss": 0.0761, "lr": 0.29566358250950175, "epoch": 0.15000122150831846, "percentage": 7.67, "elapsed_time": "3:11:26", "remaining_time": "1 day, 14:22:51", "throughput": 339.37, "total_tokens": 3898112} {"current_steps": 3075, "total_steps": 40000, "loss": 0.1097, "lr": 0.295649510014782, "epoch": 0.1502455231720128, "percentage": 7.69, "elapsed_time": "3:11:29", "remaining_time": "1 day, 14:19:25", "throughput": 339.84, "total_tokens": 3904576} {"current_steps": 3080, "total_steps": 40000, "loss": 0.068, "lr": 0.2956354150590775, "epoch": 0.15048982483570714, "percentage": 7.7, "elapsed_time": "3:11:32", "remaining_time": "1 day, 14:16:00", "throughput": 340.32, "total_tokens": 3911072} {"current_steps": 3085, "total_steps": 40000, "loss": 0.0609, "lr": 0.2956212976445618, "epoch": 0.15073412649940146, "percentage": 7.71, "elapsed_time": "3:11:35", "remaining_time": "1 day, 14:12:36", "throughput": 340.79, "total_tokens": 3917568} {"current_steps": 3090, "total_steps": 40000, "loss": 0.0874, "lr": 0.295607157773412, "epoch": 0.15097842816309578, "percentage": 7.72, "elapsed_time": "3:11:38", "remaining_time": "1 day, 14:09:11", "throughput": 341.24, "total_tokens": 3923840} {"current_steps": 3095, "total_steps": 40000, "loss": 0.1116, "lr": 0.2955929954478087, "epoch": 0.1512227298267901, "percentage": 7.74, "elapsed_time": "3:11:41", "remaining_time": "1 day, 14:05:47", "throughput": 341.68, "total_tokens": 3929952} {"current_steps": 3100, "total_steps": 40000, "loss": 0.1126, "lr": 0.29557881066993585, "epoch": 0.15146703149048446, "percentage": 7.75, "elapsed_time": "3:11:44", "remaining_time": "1 day, 14:02:24", "throughput": 342.15, "total_tokens": 3936352} {"current_steps": 3105, "total_steps": 40000, "loss": 0.0794, "lr": 0.29556460344198093, "epoch": 0.15171133315417878, "percentage": 7.76, "elapsed_time": "3:11:47", "remaining_time": "1 day, 13:59:01", "throughput": 342.61, "total_tokens": 3942720} {"current_steps": 3110, "total_steps": 40000, "loss": 0.0642, "lr": 0.29555037376613486, "epoch": 0.1519556348178731, "percentage": 7.78, "elapsed_time": "3:11:51", "remaining_time": "1 day, 13:55:41", "throughput": 343.1, "total_tokens": 3949504} {"current_steps": 3115, "total_steps": 40000, "loss": 0.107, "lr": 0.29553612164459203, "epoch": 0.15219993648156743, "percentage": 7.79, "elapsed_time": "3:11:54", "remaining_time": "1 day, 13:52:19", "throughput": 343.53, "total_tokens": 3955456} {"current_steps": 3120, "total_steps": 40000, "loss": 0.1294, "lr": 0.29552184707955037, "epoch": 0.15244423814526176, "percentage": 7.8, "elapsed_time": "3:11:57", "remaining_time": "1 day, 13:48:59", "throughput": 344.0, "total_tokens": 3961920} {"current_steps": 3125, "total_steps": 40000, "loss": 0.1018, "lr": 0.29550755007321117, "epoch": 0.1526885398089561, "percentage": 7.81, "elapsed_time": "3:12:00", "remaining_time": "1 day, 13:45:39", "throughput": 344.45, "total_tokens": 3968160} {"current_steps": 3130, "total_steps": 40000, "loss": 0.0901, "lr": 0.29549323062777916, "epoch": 0.15293284147265043, "percentage": 7.83, "elapsed_time": "3:12:03", "remaining_time": "1 day, 13:42:20", "throughput": 344.92, "total_tokens": 3974592} {"current_steps": 3135, "total_steps": 40000, "loss": 0.0664, "lr": 0.29547888874546263, "epoch": 0.15317714313634476, "percentage": 7.84, "elapsed_time": "3:12:06", "remaining_time": "1 day, 13:39:00", "throughput": 345.36, "total_tokens": 3980768} {"current_steps": 3140, "total_steps": 40000, "loss": 0.0831, "lr": 0.2954645244284732, "epoch": 0.15342144480003908, "percentage": 7.85, "elapsed_time": "3:12:09", "remaining_time": "1 day, 13:35:43", "throughput": 345.84, "total_tokens": 3987424} {"current_steps": 3145, "total_steps": 40000, "loss": 0.0656, "lr": 0.2954501376790261, "epoch": 0.1536657464637334, "percentage": 7.86, "elapsed_time": "3:12:12", "remaining_time": "1 day, 13:32:26", "throughput": 346.3, "total_tokens": 3993792} {"current_steps": 3150, "total_steps": 40000, "loss": 0.0709, "lr": 0.29543572849933997, "epoch": 0.15391004812742776, "percentage": 7.88, "elapsed_time": "3:12:15", "remaining_time": "1 day, 13:29:08", "throughput": 346.73, "total_tokens": 3999776} {"current_steps": 3155, "total_steps": 40000, "loss": 0.0865, "lr": 0.2954212968916368, "epoch": 0.15415434979112208, "percentage": 7.89, "elapsed_time": "3:12:18", "remaining_time": "1 day, 13:25:52", "throughput": 347.18, "total_tokens": 4006016} {"current_steps": 3160, "total_steps": 40000, "loss": 0.0844, "lr": 0.29540684285814217, "epoch": 0.1543986514548164, "percentage": 7.9, "elapsed_time": "3:12:21", "remaining_time": "1 day, 13:22:36", "throughput": 347.62, "total_tokens": 4012192} {"current_steps": 3165, "total_steps": 40000, "loss": 0.0847, "lr": 0.2953923664010851, "epoch": 0.15464295311851073, "percentage": 7.91, "elapsed_time": "3:12:24", "remaining_time": "1 day, 13:19:20", "throughput": 348.06, "total_tokens": 4018336} {"current_steps": 3170, "total_steps": 40000, "loss": 0.0643, "lr": 0.295377867522698, "epoch": 0.15488725478220508, "percentage": 7.92, "elapsed_time": "3:12:27", "remaining_time": "1 day, 13:16:07", "throughput": 348.55, "total_tokens": 4025024} {"current_steps": 3175, "total_steps": 40000, "loss": 0.103, "lr": 0.2953633462252168, "epoch": 0.1551315564458994, "percentage": 7.94, "elapsed_time": "3:12:31", "remaining_time": "1 day, 13:12:53", "throughput": 348.99, "total_tokens": 4031136} {"current_steps": 3180, "total_steps": 40000, "loss": 0.0768, "lr": 0.2953488025108809, "epoch": 0.15537585810959373, "percentage": 7.95, "elapsed_time": "3:12:34", "remaining_time": "1 day, 13:09:40", "throughput": 349.43, "total_tokens": 4037312} {"current_steps": 3185, "total_steps": 40000, "loss": 0.0531, "lr": 0.295334236381933, "epoch": 0.15562015977328805, "percentage": 7.96, "elapsed_time": "3:12:37", "remaining_time": "1 day, 13:06:29", "throughput": 349.94, "total_tokens": 4044384} {"current_steps": 3190, "total_steps": 40000, "loss": 0.0651, "lr": 0.29531964784061954, "epoch": 0.15586446143698238, "percentage": 7.98, "elapsed_time": "3:12:40", "remaining_time": "1 day, 13:03:17", "throughput": 350.38, "total_tokens": 4050560} {"current_steps": 3195, "total_steps": 40000, "loss": 0.0807, "lr": 0.2953050368891902, "epoch": 0.15610876310067673, "percentage": 7.99, "elapsed_time": "3:12:43", "remaining_time": "1 day, 13:00:07", "throughput": 350.92, "total_tokens": 4057952} {"current_steps": 3200, "total_steps": 40000, "loss": 0.112, "lr": 0.29529040352989805, "epoch": 0.15635306476437105, "percentage": 8.0, "elapsed_time": "3:12:46", "remaining_time": "1 day, 12:56:57", "throughput": 351.37, "total_tokens": 4064256} {"current_steps": 3200, "total_steps": 40000, "eval_loss": 0.08372149616479874, "epoch": 0.15635306476437105, "percentage": 8.0, "elapsed_time": "3:23:26", "remaining_time": "1 day, 14:59:33", "throughput": 332.96, "total_tokens": 4064256} {"current_steps": 3205, "total_steps": 40000, "loss": 0.1155, "lr": 0.29527574776499993, "epoch": 0.15659736642806538, "percentage": 8.01, "elapsed_time": "3:23:30", "remaining_time": "1 day, 14:56:23", "throughput": 333.37, "total_tokens": 4070656} {"current_steps": 3210, "total_steps": 40000, "loss": 0.1261, "lr": 0.2952610695967558, "epoch": 0.1568416680917597, "percentage": 8.03, "elapsed_time": "3:23:33", "remaining_time": "1 day, 14:53:01", "throughput": 333.8, "total_tokens": 4076864} {"current_steps": 3215, "total_steps": 40000, "loss": 0.0701, "lr": 0.29524636902742935, "epoch": 0.15708596975545402, "percentage": 8.04, "elapsed_time": "3:23:36", "remaining_time": "1 day, 14:49:41", "throughput": 334.28, "total_tokens": 4083840} {"current_steps": 3220, "total_steps": 40000, "loss": 0.0961, "lr": 0.2952316460592875, "epoch": 0.15733027141914838, "percentage": 8.05, "elapsed_time": "3:23:39", "remaining_time": "1 day, 14:46:20", "throughput": 334.72, "total_tokens": 4090240} {"current_steps": 3225, "total_steps": 40000, "loss": 0.1405, "lr": 0.29521690069460066, "epoch": 0.1575745730828427, "percentage": 8.06, "elapsed_time": "3:23:43", "remaining_time": "1 day, 14:43:00", "throughput": 335.14, "total_tokens": 4096416} {"current_steps": 3230, "total_steps": 40000, "loss": 0.0692, "lr": 0.29520213293564285, "epoch": 0.15781887474653702, "percentage": 8.08, "elapsed_time": "3:23:46", "remaining_time": "1 day, 14:39:41", "throughput": 335.59, "total_tokens": 4102944} {"current_steps": 3235, "total_steps": 40000, "loss": 0.0784, "lr": 0.29518734278469144, "epoch": 0.15806317641023135, "percentage": 8.09, "elapsed_time": "3:23:49", "remaining_time": "1 day, 14:36:22", "throughput": 336.03, "total_tokens": 4109408} {"current_steps": 3240, "total_steps": 40000, "loss": 0.0739, "lr": 0.29517253024402723, "epoch": 0.15830747807392567, "percentage": 8.1, "elapsed_time": "3:23:52", "remaining_time": "1 day, 14:33:02", "throughput": 336.44, "total_tokens": 4115392} {"current_steps": 3245, "total_steps": 40000, "loss": 0.0585, "lr": 0.2951576953159345, "epoch": 0.15855177973762002, "percentage": 8.11, "elapsed_time": "3:23:55", "remaining_time": "1 day, 14:29:44", "throughput": 336.87, "total_tokens": 4121728} {"current_steps": 3250, "total_steps": 40000, "loss": 0.0851, "lr": 0.29514283800270097, "epoch": 0.15879608140131435, "percentage": 8.12, "elapsed_time": "3:23:58", "remaining_time": "1 day, 14:26:27", "throughput": 337.32, "total_tokens": 4128256} {"current_steps": 3255, "total_steps": 40000, "loss": 0.0586, "lr": 0.2951279583066179, "epoch": 0.15904038306500867, "percentage": 8.14, "elapsed_time": "3:24:01", "remaining_time": "1 day, 14:23:12", "throughput": 337.8, "total_tokens": 4135168} {"current_steps": 3260, "total_steps": 40000, "loss": 0.0645, "lr": 0.2951130562299798, "epoch": 0.159284684728703, "percentage": 8.15, "elapsed_time": "3:24:04", "remaining_time": "1 day, 14:19:56", "throughput": 338.24, "total_tokens": 4141632} {"current_steps": 3265, "total_steps": 40000, "loss": 0.0642, "lr": 0.29509813177508487, "epoch": 0.15952898639239732, "percentage": 8.16, "elapsed_time": "3:24:07", "remaining_time": "1 day, 14:16:43", "throughput": 338.73, "total_tokens": 4148736} {"current_steps": 3270, "total_steps": 40000, "loss": 0.0943, "lr": 0.2950831849442346, "epoch": 0.15977328805609167, "percentage": 8.18, "elapsed_time": "3:24:11", "remaining_time": "1 day, 14:13:28", "throughput": 339.17, "total_tokens": 4155168} {"current_steps": 3275, "total_steps": 40000, "loss": 0.0837, "lr": 0.2950682157397339, "epoch": 0.160017589719786, "percentage": 8.19, "elapsed_time": "3:24:14", "remaining_time": "1 day, 14:10:13", "throughput": 339.6, "total_tokens": 4161440} {"current_steps": 3280, "total_steps": 40000, "loss": 0.0637, "lr": 0.2950532241638914, "epoch": 0.16026189138348032, "percentage": 8.2, "elapsed_time": "3:24:17", "remaining_time": "1 day, 14:07:00", "throughput": 340.03, "total_tokens": 4167840} {"current_steps": 3285, "total_steps": 40000, "loss": 0.1072, "lr": 0.2950382102190188, "epoch": 0.16050619304717464, "percentage": 8.21, "elapsed_time": "3:24:20", "remaining_time": "1 day, 14:03:47", "throughput": 340.46, "total_tokens": 4174112} {"current_steps": 3290, "total_steps": 40000, "loss": 0.0695, "lr": 0.2950231739074316, "epoch": 0.16075049471086897, "percentage": 8.22, "elapsed_time": "3:24:23", "remaining_time": "1 day, 14:00:34", "throughput": 340.86, "total_tokens": 4180032} {"current_steps": 3295, "total_steps": 40000, "loss": 0.1006, "lr": 0.29500811523144843, "epoch": 0.16099479637456332, "percentage": 8.24, "elapsed_time": "3:24:26", "remaining_time": "1 day, 13:57:21", "throughput": 341.26, "total_tokens": 4186016} {"current_steps": 3300, "total_steps": 40000, "loss": 0.0844, "lr": 0.2949930341933917, "epoch": 0.16123909803825764, "percentage": 8.25, "elapsed_time": "3:24:29", "remaining_time": "1 day, 13:54:10", "throughput": 341.67, "total_tokens": 4192128} {"current_steps": 3305, "total_steps": 40000, "loss": 0.0992, "lr": 0.29497793079558693, "epoch": 0.16148339970195197, "percentage": 8.26, "elapsed_time": "3:24:32", "remaining_time": "1 day, 13:51:01", "throughput": 342.15, "total_tokens": 4199072} {"current_steps": 3310, "total_steps": 40000, "loss": 0.1086, "lr": 0.2949628050403633, "epoch": 0.1617277013656463, "percentage": 8.28, "elapsed_time": "3:24:35", "remaining_time": "1 day, 13:47:50", "throughput": 342.56, "total_tokens": 4205088} {"current_steps": 3315, "total_steps": 40000, "loss": 0.0722, "lr": 0.2949476569300535, "epoch": 0.16197200302934062, "percentage": 8.29, "elapsed_time": "3:24:38", "remaining_time": "1 day, 13:44:40", "throughput": 342.96, "total_tokens": 4211136} {"current_steps": 3320, "total_steps": 40000, "loss": 0.0921, "lr": 0.29493248646699344, "epoch": 0.16221630469303497, "percentage": 8.3, "elapsed_time": "3:24:41", "remaining_time": "1 day, 13:41:30", "throughput": 343.38, "total_tokens": 4217280} {"current_steps": 3325, "total_steps": 40000, "loss": 0.0715, "lr": 0.29491729365352265, "epoch": 0.1624606063567293, "percentage": 8.31, "elapsed_time": "3:24:44", "remaining_time": "1 day, 13:38:23", "throughput": 343.85, "total_tokens": 4224128} {"current_steps": 3330, "total_steps": 40000, "loss": 0.0903, "lr": 0.29490207849198397, "epoch": 0.16270490802042362, "percentage": 8.33, "elapsed_time": "3:24:47", "remaining_time": "1 day, 13:35:15", "throughput": 344.27, "total_tokens": 4230368} {"current_steps": 3335, "total_steps": 40000, "loss": 0.1033, "lr": 0.29488684098472384, "epoch": 0.16294920968411794, "percentage": 8.34, "elapsed_time": "3:24:51", "remaining_time": "1 day, 13:32:08", "throughput": 344.73, "total_tokens": 4237088} {"current_steps": 3340, "total_steps": 40000, "loss": 0.0665, "lr": 0.2948715811340921, "epoch": 0.1631935113478123, "percentage": 8.35, "elapsed_time": "3:24:54", "remaining_time": "1 day, 13:29:01", "throughput": 345.17, "total_tokens": 4243552} {"current_steps": 3345, "total_steps": 40000, "loss": 0.0755, "lr": 0.294856298942442, "epoch": 0.16343781301150662, "percentage": 8.36, "elapsed_time": "3:24:57", "remaining_time": "1 day, 13:25:56", "throughput": 345.6, "total_tokens": 4249952} {"current_steps": 3350, "total_steps": 40000, "loss": 0.1073, "lr": 0.2948409944121302, "epoch": 0.16368211467520094, "percentage": 8.38, "elapsed_time": "3:25:00", "remaining_time": "1 day, 13:22:48", "throughput": 345.97, "total_tokens": 4255584} {"current_steps": 3355, "total_steps": 40000, "loss": 0.0916, "lr": 0.29482566754551687, "epoch": 0.16392641633889526, "percentage": 8.39, "elapsed_time": "3:25:03", "remaining_time": "1 day, 13:19:43", "throughput": 346.4, "total_tokens": 4261888} {"current_steps": 3360, "total_steps": 40000, "loss": 0.0794, "lr": 0.2948103183449656, "epoch": 0.1641707180025896, "percentage": 8.4, "elapsed_time": "3:25:06", "remaining_time": "1 day, 13:16:39", "throughput": 346.84, "total_tokens": 4268416} {"current_steps": 3365, "total_steps": 40000, "loss": 0.089, "lr": 0.2947949468128435, "epoch": 0.16441501966628394, "percentage": 8.41, "elapsed_time": "3:25:09", "remaining_time": "1 day, 13:13:35", "throughput": 347.27, "total_tokens": 4274752} {"current_steps": 3370, "total_steps": 40000, "loss": 0.1046, "lr": 0.2947795529515209, "epoch": 0.16465932132997826, "percentage": 8.43, "elapsed_time": "3:25:12", "remaining_time": "1 day, 13:10:31", "throughput": 347.69, "total_tokens": 4281056} {"current_steps": 3375, "total_steps": 40000, "loss": 0.0759, "lr": 0.29476413676337193, "epoch": 0.1649036229936726, "percentage": 8.44, "elapsed_time": "3:25:15", "remaining_time": "1 day, 13:07:30", "throughput": 348.17, "total_tokens": 4288000} {"current_steps": 3380, "total_steps": 40000, "loss": 0.0955, "lr": 0.2947486982507738, "epoch": 0.1651479246573669, "percentage": 8.45, "elapsed_time": "3:25:18", "remaining_time": "1 day, 13:04:27", "throughput": 348.61, "total_tokens": 4294464} {"current_steps": 3385, "total_steps": 40000, "loss": 0.0815, "lr": 0.29473323741610735, "epoch": 0.16539222632106124, "percentage": 8.46, "elapsed_time": "3:25:22", "remaining_time": "1 day, 13:01:26", "throughput": 349.03, "total_tokens": 4300800} {"current_steps": 3390, "total_steps": 40000, "loss": 0.0966, "lr": 0.2947177542617569, "epoch": 0.1656365279847556, "percentage": 8.48, "elapsed_time": "3:25:25", "remaining_time": "1 day, 12:58:23", "throughput": 349.45, "total_tokens": 4306944} {"current_steps": 3395, "total_steps": 40000, "loss": 0.1295, "lr": 0.2947022487901101, "epoch": 0.1658808296484499, "percentage": 8.49, "elapsed_time": "3:25:28", "remaining_time": "1 day, 12:55:23", "throughput": 349.88, "total_tokens": 4313344} {"current_steps": 3400, "total_steps": 40000, "loss": 0.1053, "lr": 0.2946867210035581, "epoch": 0.16612513131214424, "percentage": 8.5, "elapsed_time": "3:25:31", "remaining_time": "1 day, 12:52:22", "throughput": 350.31, "total_tokens": 4319712} {"current_steps": 3400, "total_steps": 40000, "eval_loss": 0.0932849794626236, "epoch": 0.16612513131214424, "percentage": 8.5, "elapsed_time": "3:36:10", "remaining_time": "1 day, 14:47:04", "throughput": 333.04, "total_tokens": 4319712} {"current_steps": 3405, "total_steps": 40000, "loss": 0.0817, "lr": 0.2946711709044954, "epoch": 0.16636943297583856, "percentage": 8.51, "elapsed_time": "3:36:14", "remaining_time": "1 day, 14:44:04", "throughput": 333.42, "total_tokens": 4325952} {"current_steps": 3410, "total_steps": 40000, "loss": 0.0569, "lr": 0.2946555984953202, "epoch": 0.16661373463953288, "percentage": 8.53, "elapsed_time": "3:36:17", "remaining_time": "1 day, 14:40:53", "throughput": 333.82, "total_tokens": 4332192} {"current_steps": 3415, "total_steps": 40000, "loss": 0.0726, "lr": 0.2946400037784338, "epoch": 0.16685803630322724, "percentage": 8.54, "elapsed_time": "3:36:20", "remaining_time": "1 day, 14:37:42", "throughput": 334.2, "total_tokens": 4338176} {"current_steps": 3420, "total_steps": 40000, "loss": 0.0938, "lr": 0.29462438675624114, "epoch": 0.16710233796692156, "percentage": 8.55, "elapsed_time": "3:36:23", "remaining_time": "1 day, 14:34:32", "throughput": 334.58, "total_tokens": 4344064} {"current_steps": 3425, "total_steps": 40000, "loss": 0.0601, "lr": 0.2946087474311506, "epoch": 0.16734663963061588, "percentage": 8.56, "elapsed_time": "3:36:26", "remaining_time": "1 day, 14:31:24", "throughput": 334.99, "total_tokens": 4350496} {"current_steps": 3430, "total_steps": 40000, "loss": 0.0769, "lr": 0.294593085805574, "epoch": 0.1675909412943102, "percentage": 8.58, "elapsed_time": "3:36:30", "remaining_time": "1 day, 14:28:16", "throughput": 335.43, "total_tokens": 4357248} {"current_steps": 3435, "total_steps": 40000, "loss": 0.0876, "lr": 0.2945774018819264, "epoch": 0.16783524295800453, "percentage": 8.59, "elapsed_time": "3:36:32", "remaining_time": "1 day, 14:25:07", "throughput": 335.79, "total_tokens": 4362944} {"current_steps": 3440, "total_steps": 40000, "loss": 0.0626, "lr": 0.2945616956626266, "epoch": 0.16807954462169888, "percentage": 8.6, "elapsed_time": "3:36:36", "remaining_time": "1 day, 14:22:00", "throughput": 336.2, "total_tokens": 4369216} {"current_steps": 3445, "total_steps": 40000, "loss": 0.0631, "lr": 0.2945459671500966, "epoch": 0.1683238462853932, "percentage": 8.61, "elapsed_time": "3:36:39", "remaining_time": "1 day, 14:18:54", "throughput": 336.6, "total_tokens": 4375552} {"current_steps": 3450, "total_steps": 40000, "loss": 0.0896, "lr": 0.2945302163467621, "epoch": 0.16856814794908753, "percentage": 8.62, "elapsed_time": "3:36:42", "remaining_time": "1 day, 14:15:47", "throughput": 337.01, "total_tokens": 4381888} {"current_steps": 3455, "total_steps": 40000, "loss": 0.0845, "lr": 0.2945144432550519, "epoch": 0.16881244961278186, "percentage": 8.64, "elapsed_time": "3:36:45", "remaining_time": "1 day, 14:12:43", "throughput": 337.43, "total_tokens": 4388416} {"current_steps": 3460, "total_steps": 40000, "loss": 0.0706, "lr": 0.29449864787739843, "epoch": 0.16905675127647618, "percentage": 8.65, "elapsed_time": "3:36:48", "remaining_time": "1 day, 14:09:38", "throughput": 337.85, "total_tokens": 4394880} {"current_steps": 3465, "total_steps": 40000, "loss": 0.0761, "lr": 0.2944828302162376, "epoch": 0.16930105294017053, "percentage": 8.66, "elapsed_time": "3:36:51", "remaining_time": "1 day, 14:06:34", "throughput": 338.25, "total_tokens": 4401216} {"current_steps": 3470, "total_steps": 40000, "loss": 0.0946, "lr": 0.2944669902740087, "epoch": 0.16954535460386486, "percentage": 8.67, "elapsed_time": "3:36:54", "remaining_time": "1 day, 14:03:30", "throughput": 338.68, "total_tokens": 4407840} {"current_steps": 3475, "total_steps": 40000, "loss": 0.1002, "lr": 0.2944511280531544, "epoch": 0.16978965626755918, "percentage": 8.69, "elapsed_time": "3:36:57", "remaining_time": "1 day, 14:00:27", "throughput": 339.09, "total_tokens": 4414272} {"current_steps": 3480, "total_steps": 40000, "loss": 0.1249, "lr": 0.29443524355612083, "epoch": 0.1700339579312535, "percentage": 8.7, "elapsed_time": "3:37:00", "remaining_time": "1 day, 13:57:24", "throughput": 339.49, "total_tokens": 4420512} {"current_steps": 3485, "total_steps": 40000, "loss": 0.0608, "lr": 0.29441933678535764, "epoch": 0.17027825959494783, "percentage": 8.71, "elapsed_time": "3:37:03", "remaining_time": "1 day, 13:54:21", "throughput": 339.89, "total_tokens": 4426688} {"current_steps": 3490, "total_steps": 40000, "loss": 0.0984, "lr": 0.29440340774331786, "epoch": 0.17052256125864218, "percentage": 8.72, "elapsed_time": "3:37:07", "remaining_time": "1 day, 13:51:19", "throughput": 340.29, "total_tokens": 4432960} {"current_steps": 3495, "total_steps": 40000, "loss": 0.0832, "lr": 0.2943874564324579, "epoch": 0.1707668629223365, "percentage": 8.74, "elapsed_time": "3:37:10", "remaining_time": "1 day, 13:48:18", "throughput": 340.7, "total_tokens": 4439360} {"current_steps": 3500, "total_steps": 40000, "loss": 0.0887, "lr": 0.2943714828552376, "epoch": 0.17101116458603083, "percentage": 8.75, "elapsed_time": "3:37:13", "remaining_time": "1 day, 13:45:17", "throughput": 341.09, "total_tokens": 4445504} {"current_steps": 3505, "total_steps": 40000, "loss": 0.108, "lr": 0.29435548701412045, "epoch": 0.17125546624972515, "percentage": 8.76, "elapsed_time": "3:37:16", "remaining_time": "1 day, 13:42:16", "throughput": 341.48, "total_tokens": 4451680} {"current_steps": 3510, "total_steps": 40000, "loss": 0.0536, "lr": 0.2943394689115731, "epoch": 0.1714997679134195, "percentage": 8.77, "elapsed_time": "3:37:19", "remaining_time": "1 day, 13:39:16", "throughput": 341.89, "total_tokens": 4457984} {"current_steps": 3515, "total_steps": 40000, "loss": 0.0849, "lr": 0.29432342855006577, "epoch": 0.17174406957711383, "percentage": 8.79, "elapsed_time": "3:37:22", "remaining_time": "1 day, 13:36:16", "throughput": 342.27, "total_tokens": 4464032} {"current_steps": 3520, "total_steps": 40000, "loss": 0.055, "lr": 0.294307365932072, "epoch": 0.17198837124080815, "percentage": 8.8, "elapsed_time": "3:37:25", "remaining_time": "1 day, 13:33:19", "throughput": 342.73, "total_tokens": 4471040} {"current_steps": 3525, "total_steps": 40000, "loss": 0.0734, "lr": 0.294291281060069, "epoch": 0.17223267290450248, "percentage": 8.81, "elapsed_time": "3:37:28", "remaining_time": "1 day, 13:30:20", "throughput": 343.12, "total_tokens": 4477280} {"current_steps": 3530, "total_steps": 40000, "loss": 0.1052, "lr": 0.29427517393653724, "epoch": 0.1724769745681968, "percentage": 8.82, "elapsed_time": "3:37:31", "remaining_time": "1 day, 13:27:21", "throughput": 343.48, "total_tokens": 4482912} {"current_steps": 3535, "total_steps": 40000, "loss": 0.066, "lr": 0.29425904456396046, "epoch": 0.17272127623189115, "percentage": 8.84, "elapsed_time": "3:37:34", "remaining_time": "1 day, 13:24:23", "throughput": 343.88, "total_tokens": 4489184} {"current_steps": 3540, "total_steps": 40000, "loss": 0.0535, "lr": 0.2942428929448262, "epoch": 0.17296557789558548, "percentage": 8.85, "elapsed_time": "3:37:37", "remaining_time": "1 day, 13:21:28", "throughput": 344.32, "total_tokens": 4496064} {"current_steps": 3545, "total_steps": 40000, "loss": 0.0794, "lr": 0.2942267190816252, "epoch": 0.1732098795592798, "percentage": 8.86, "elapsed_time": "3:37:40", "remaining_time": "1 day, 13:18:31", "throughput": 344.72, "total_tokens": 4502304} {"current_steps": 3550, "total_steps": 40000, "loss": 0.0559, "lr": 0.2942105229768516, "epoch": 0.17345418122297412, "percentage": 8.88, "elapsed_time": "3:37:43", "remaining_time": "1 day, 13:15:35", "throughput": 345.14, "total_tokens": 4508896} {"current_steps": 3555, "total_steps": 40000, "loss": 0.0919, "lr": 0.29419430463300306, "epoch": 0.17369848288666845, "percentage": 8.89, "elapsed_time": "3:37:47", "remaining_time": "1 day, 13:12:40", "throughput": 345.55, "total_tokens": 4515264} {"current_steps": 3560, "total_steps": 40000, "loss": 0.0541, "lr": 0.2941780640525808, "epoch": 0.1739427845503628, "percentage": 8.9, "elapsed_time": "3:37:50", "remaining_time": "1 day, 13:09:44", "throughput": 345.94, "total_tokens": 4521408} {"current_steps": 3565, "total_steps": 40000, "loss": 0.1082, "lr": 0.2941618012380891, "epoch": 0.17418708621405712, "percentage": 8.91, "elapsed_time": "3:37:53", "remaining_time": "1 day, 13:06:49", "throughput": 346.33, "total_tokens": 4527552} {"current_steps": 3570, "total_steps": 40000, "loss": 0.0858, "lr": 0.29414551619203605, "epoch": 0.17443138787775145, "percentage": 8.92, "elapsed_time": "3:37:56", "remaining_time": "1 day, 13:03:56", "throughput": 346.74, "total_tokens": 4533984} {"current_steps": 3575, "total_steps": 40000, "loss": 0.1249, "lr": 0.29412920891693295, "epoch": 0.17467568954144577, "percentage": 8.94, "elapsed_time": "3:37:59", "remaining_time": "1 day, 13:01:01", "throughput": 347.12, "total_tokens": 4540032} {"current_steps": 3580, "total_steps": 40000, "loss": 0.0886, "lr": 0.2941128794152946, "epoch": 0.1749199912051401, "percentage": 8.95, "elapsed_time": "3:38:02", "remaining_time": "1 day, 12:58:07", "throughput": 347.49, "total_tokens": 4545984} {"current_steps": 3585, "total_steps": 40000, "loss": 0.0902, "lr": 0.2940965276896392, "epoch": 0.17516429286883445, "percentage": 8.96, "elapsed_time": "3:38:05", "remaining_time": "1 day, 12:55:15", "throughput": 347.91, "total_tokens": 4552448} {"current_steps": 3590, "total_steps": 40000, "loss": 0.0734, "lr": 0.2940801537424884, "epoch": 0.17540859453252877, "percentage": 8.97, "elapsed_time": "3:38:08", "remaining_time": "1 day, 12:52:23", "throughput": 348.31, "total_tokens": 4558784} {"current_steps": 3595, "total_steps": 40000, "loss": 0.0777, "lr": 0.2940637575763673, "epoch": 0.1756528961962231, "percentage": 8.99, "elapsed_time": "3:38:11", "remaining_time": "1 day, 12:49:31", "throughput": 348.71, "total_tokens": 4565056} {"current_steps": 3600, "total_steps": 40000, "loss": 0.0469, "lr": 0.2940473391938043, "epoch": 0.17589719785991742, "percentage": 9.0, "elapsed_time": "3:38:14", "remaining_time": "1 day, 12:46:39", "throughput": 349.09, "total_tokens": 4571104} {"current_steps": 3600, "total_steps": 40000, "eval_loss": 0.08289935439825058, "epoch": 0.17589719785991742, "percentage": 9.0, "elapsed_time": "3:48:53", "remaining_time": "1 day, 14:34:19", "throughput": 332.85, "total_tokens": 4571104} {"current_steps": 3605, "total_steps": 40000, "loss": 0.0588, "lr": 0.29403089859733145, "epoch": 0.17614149952361174, "percentage": 9.01, "elapsed_time": "3:48:57", "remaining_time": "1 day, 14:31:25", "throughput": 333.23, "total_tokens": 4577632} {"current_steps": 3610, "total_steps": 40000, "loss": 0.0885, "lr": 0.294014435789484, "epoch": 0.1763858011873061, "percentage": 9.03, "elapsed_time": "3:49:00", "remaining_time": "1 day, 14:28:24", "throughput": 333.61, "total_tokens": 4583776} {"current_steps": 3615, "total_steps": 40000, "loss": 0.1127, "lr": 0.2939979507728007, "epoch": 0.17663010285100042, "percentage": 9.04, "elapsed_time": "3:49:03", "remaining_time": "1 day, 14:25:24", "throughput": 333.98, "total_tokens": 4589888} {"current_steps": 3620, "total_steps": 40000, "loss": 0.1154, "lr": 0.2939814435498239, "epoch": 0.17687440451469474, "percentage": 9.05, "elapsed_time": "3:49:06", "remaining_time": "1 day, 14:22:26", "throughput": 334.4, "total_tokens": 4596704} {"current_steps": 3625, "total_steps": 40000, "loss": 0.0987, "lr": 0.29396491412309905, "epoch": 0.17711870617838907, "percentage": 9.06, "elapsed_time": "3:49:09", "remaining_time": "1 day, 14:19:29", "throughput": 334.82, "total_tokens": 4603552} {"current_steps": 3630, "total_steps": 40000, "loss": 0.091, "lr": 0.2939483624951753, "epoch": 0.1773630078420834, "percentage": 9.07, "elapsed_time": "3:49:12", "remaining_time": "1 day, 14:16:30", "throughput": 335.19, "total_tokens": 4609728} {"current_steps": 3635, "total_steps": 40000, "loss": 0.0779, "lr": 0.2939317886686051, "epoch": 0.17760730950577774, "percentage": 9.09, "elapsed_time": "3:49:15", "remaining_time": "1 day, 14:13:33", "throughput": 335.6, "total_tokens": 4616416} {"current_steps": 3640, "total_steps": 40000, "loss": 0.0691, "lr": 0.2939151926459443, "epoch": 0.17785161116947207, "percentage": 9.1, "elapsed_time": "3:49:18", "remaining_time": "1 day, 14:10:36", "throughput": 335.94, "total_tokens": 4622144} {"current_steps": 3645, "total_steps": 40000, "loss": 0.0952, "lr": 0.2938985744297522, "epoch": 0.1780959128331664, "percentage": 9.11, "elapsed_time": "3:49:21", "remaining_time": "1 day, 14:07:39", "throughput": 336.31, "total_tokens": 4628256} {"current_steps": 3650, "total_steps": 40000, "loss": 0.0651, "lr": 0.29388193402259166, "epoch": 0.17834021449686072, "percentage": 9.12, "elapsed_time": "3:49:24", "remaining_time": "1 day, 14:04:42", "throughput": 336.69, "total_tokens": 4634432} {"current_steps": 3655, "total_steps": 40000, "loss": 0.0719, "lr": 0.29386527142702873, "epoch": 0.17858451616055504, "percentage": 9.14, "elapsed_time": "3:49:27", "remaining_time": "1 day, 14:01:47", "throughput": 337.08, "total_tokens": 4640864} {"current_steps": 3660, "total_steps": 40000, "loss": 0.0902, "lr": 0.293848586645633, "epoch": 0.1788288178242494, "percentage": 9.15, "elapsed_time": "3:49:31", "remaining_time": "1 day, 13:58:51", "throughput": 337.45, "total_tokens": 4647040} {"current_steps": 3665, "total_steps": 40000, "loss": 0.0798, "lr": 0.2938318796809775, "epoch": 0.17907311948794372, "percentage": 9.16, "elapsed_time": "3:49:34", "remaining_time": "1 day, 13:55:57", "throughput": 337.84, "total_tokens": 4653472} {"current_steps": 3670, "total_steps": 40000, "loss": 0.0796, "lr": 0.29381515053563867, "epoch": 0.17931742115163804, "percentage": 9.18, "elapsed_time": "3:49:37", "remaining_time": "1 day, 13:53:03", "throughput": 338.23, "total_tokens": 4659936} {"current_steps": 3675, "total_steps": 40000, "loss": 0.0774, "lr": 0.29379839921219636, "epoch": 0.17956172281533236, "percentage": 9.19, "elapsed_time": "3:49:40", "remaining_time": "1 day, 13:50:08", "throughput": 338.62, "total_tokens": 4666240} {"current_steps": 3680, "total_steps": 40000, "loss": 0.0746, "lr": 0.2937816257132338, "epoch": 0.17980602447902672, "percentage": 9.2, "elapsed_time": "3:49:43", "remaining_time": "1 day, 13:47:15", "throughput": 338.99, "total_tokens": 4672384} {"current_steps": 3685, "total_steps": 40000, "loss": 0.0988, "lr": 0.2937648300413376, "epoch": 0.18005032614272104, "percentage": 9.21, "elapsed_time": "3:49:46", "remaining_time": "1 day, 13:44:20", "throughput": 339.33, "total_tokens": 4678112} {"current_steps": 3690, "total_steps": 40000, "loss": 0.0787, "lr": 0.293748012199098, "epoch": 0.18029462780641536, "percentage": 9.22, "elapsed_time": "3:49:49", "remaining_time": "1 day, 13:41:29", "throughput": 339.73, "total_tokens": 4684704} {"current_steps": 3695, "total_steps": 40000, "loss": 0.0771, "lr": 0.29373117218910844, "epoch": 0.1805389294701097, "percentage": 9.24, "elapsed_time": "3:49:52", "remaining_time": "1 day, 13:38:36", "throughput": 340.1, "total_tokens": 4690752} {"current_steps": 3700, "total_steps": 40000, "loss": 0.0537, "lr": 0.2937143100139659, "epoch": 0.180783231133804, "percentage": 9.25, "elapsed_time": "3:49:55", "remaining_time": "1 day, 13:35:45", "throughput": 340.48, "total_tokens": 4697120} {"current_steps": 3705, "total_steps": 40000, "loss": 0.0974, "lr": 0.29369742567627083, "epoch": 0.18102753279749836, "percentage": 9.26, "elapsed_time": "3:49:58", "remaining_time": "1 day, 13:32:55", "throughput": 340.89, "total_tokens": 4703840} {"current_steps": 3710, "total_steps": 40000, "loss": 0.0943, "lr": 0.29368051917862675, "epoch": 0.1812718344611927, "percentage": 9.28, "elapsed_time": "3:50:01", "remaining_time": "1 day, 13:30:04", "throughput": 341.25, "total_tokens": 4709888} {"current_steps": 3715, "total_steps": 40000, "loss": 0.0613, "lr": 0.2936635905236411, "epoch": 0.181516136124887, "percentage": 9.29, "elapsed_time": "3:50:04", "remaining_time": "1 day, 13:27:13", "throughput": 341.62, "total_tokens": 4716032} {"current_steps": 3720, "total_steps": 40000, "loss": 0.0854, "lr": 0.2936466397139244, "epoch": 0.18176043778858134, "percentage": 9.3, "elapsed_time": "3:50:07", "remaining_time": "1 day, 13:24:24", "throughput": 342.02, "total_tokens": 4722592} {"current_steps": 3725, "total_steps": 40000, "loss": 0.0868, "lr": 0.2936296667520907, "epoch": 0.18200473945227566, "percentage": 9.31, "elapsed_time": "3:50:10", "remaining_time": "1 day, 13:21:34", "throughput": 342.36, "total_tokens": 4728288} {"current_steps": 3730, "total_steps": 40000, "loss": 0.0787, "lr": 0.2936126716407574, "epoch": 0.18224904111597, "percentage": 9.32, "elapsed_time": "3:50:13", "remaining_time": "1 day, 13:18:45", "throughput": 342.73, "total_tokens": 4734432} {"current_steps": 3735, "total_steps": 40000, "loss": 0.0996, "lr": 0.29359565438254537, "epoch": 0.18249334277966434, "percentage": 9.34, "elapsed_time": "3:50:17", "remaining_time": "1 day, 13:15:57", "throughput": 343.14, "total_tokens": 4741280} {"current_steps": 3740, "total_steps": 40000, "loss": 0.0885, "lr": 0.29357861498007887, "epoch": 0.18273764444335866, "percentage": 9.35, "elapsed_time": "3:50:20", "remaining_time": "1 day, 13:13:09", "throughput": 343.51, "total_tokens": 4747328} {"current_steps": 3745, "total_steps": 40000, "loss": 0.0783, "lr": 0.29356155343598567, "epoch": 0.18298194610705298, "percentage": 9.36, "elapsed_time": "3:50:23", "remaining_time": "1 day, 13:10:21", "throughput": 343.87, "total_tokens": 4753472} {"current_steps": 3750, "total_steps": 40000, "loss": 0.066, "lr": 0.2935444697528968, "epoch": 0.1832262477707473, "percentage": 9.38, "elapsed_time": "3:50:26", "remaining_time": "1 day, 13:07:34", "throughput": 344.25, "total_tokens": 4759648} {"current_steps": 3755, "total_steps": 40000, "loss": 0.0804, "lr": 0.2935273639334468, "epoch": 0.18347054943444166, "percentage": 9.39, "elapsed_time": "3:50:29", "remaining_time": "1 day, 13:04:48", "throughput": 344.65, "total_tokens": 4766304} {"current_steps": 3760, "total_steps": 40000, "loss": 0.1144, "lr": 0.29351023598027365, "epoch": 0.18371485109813598, "percentage": 9.4, "elapsed_time": "3:50:32", "remaining_time": "1 day, 13:02:02", "throughput": 345.04, "total_tokens": 4772864} {"current_steps": 3765, "total_steps": 40000, "loss": 0.0677, "lr": 0.2934930858960186, "epoch": 0.1839591527618303, "percentage": 9.41, "elapsed_time": "3:50:35", "remaining_time": "1 day, 12:59:15", "throughput": 345.38, "total_tokens": 4778464} {"current_steps": 3770, "total_steps": 40000, "loss": 0.0635, "lr": 0.29347591368332643, "epoch": 0.18420345442552463, "percentage": 9.43, "elapsed_time": "3:50:38", "remaining_time": "1 day, 12:56:30", "throughput": 345.75, "total_tokens": 4784704} {"current_steps": 3775, "total_steps": 40000, "loss": 0.0566, "lr": 0.2934587193448454, "epoch": 0.18444775608921896, "percentage": 9.44, "elapsed_time": "3:50:41", "remaining_time": "1 day, 12:53:46", "throughput": 346.16, "total_tokens": 4791424} {"current_steps": 3780, "total_steps": 40000, "loss": 0.0714, "lr": 0.29344150288322696, "epoch": 0.1846920577529133, "percentage": 9.45, "elapsed_time": "3:50:45", "remaining_time": "1 day, 12:51:03", "throughput": 346.56, "total_tokens": 4798112} {"current_steps": 3785, "total_steps": 40000, "loss": 0.1041, "lr": 0.2934242643011263, "epoch": 0.18493635941660763, "percentage": 9.46, "elapsed_time": "3:50:48", "remaining_time": "1 day, 12:48:18", "throughput": 346.92, "total_tokens": 4804160} {"current_steps": 3790, "total_steps": 40000, "loss": 0.0724, "lr": 0.2934070036012016, "epoch": 0.18518066108030196, "percentage": 9.47, "elapsed_time": "3:50:51", "remaining_time": "1 day, 12:45:34", "throughput": 347.29, "total_tokens": 4810304} {"current_steps": 3795, "total_steps": 40000, "loss": 0.0911, "lr": 0.29338972078611475, "epoch": 0.18542496274399628, "percentage": 9.49, "elapsed_time": "3:50:54", "remaining_time": "1 day, 12:42:50", "throughput": 347.63, "total_tokens": 4816032} {"current_steps": 3800, "total_steps": 40000, "loss": 0.1035, "lr": 0.2933724158585311, "epoch": 0.1856692644076906, "percentage": 9.5, "elapsed_time": "3:50:57", "remaining_time": "1 day, 12:40:06", "throughput": 347.99, "total_tokens": 4822176} {"current_steps": 3800, "total_steps": 40000, "eval_loss": 0.08299132436513901, "epoch": 0.1856692644076906, "percentage": 9.5, "elapsed_time": "4:01:35", "remaining_time": "1 day, 14:21:31", "throughput": 332.66, "total_tokens": 4822176} {"current_steps": 3805, "total_steps": 40000, "loss": 0.0918, "lr": 0.29335508882111916, "epoch": 0.18591356607138496, "percentage": 9.51, "elapsed_time": "4:01:39", "remaining_time": "1 day, 14:18:45", "throughput": 332.99, "total_tokens": 4828096} {"current_steps": 3810, "total_steps": 40000, "loss": 0.0609, "lr": 0.29333773967655097, "epoch": 0.18615786773507928, "percentage": 9.53, "elapsed_time": "4:01:42", "remaining_time": "1 day, 14:15:55", "throughput": 333.38, "total_tokens": 4834848} {"current_steps": 3815, "total_steps": 40000, "loss": 0.0752, "lr": 0.2933203684275021, "epoch": 0.1864021693987736, "percentage": 9.54, "elapsed_time": "4:01:45", "remaining_time": "1 day, 14:13:04", "throughput": 333.72, "total_tokens": 4840864} {"current_steps": 3820, "total_steps": 40000, "loss": 0.0773, "lr": 0.2933029750766513, "epoch": 0.18664647106246793, "percentage": 9.55, "elapsed_time": "4:01:48", "remaining_time": "1 day, 14:10:14", "throughput": 334.08, "total_tokens": 4847040} {"current_steps": 3825, "total_steps": 40000, "loss": 0.0706, "lr": 0.2932855596266809, "epoch": 0.18689077272616225, "percentage": 9.56, "elapsed_time": "4:01:51", "remaining_time": "1 day, 14:07:24", "throughput": 334.44, "total_tokens": 4853344} {"current_steps": 3830, "total_steps": 40000, "loss": 0.0685, "lr": 0.2932681220802765, "epoch": 0.1871350743898566, "percentage": 9.57, "elapsed_time": "4:01:54", "remaining_time": "1 day, 14:04:34", "throughput": 334.8, "total_tokens": 4859488} {"current_steps": 3835, "total_steps": 40000, "loss": 0.1178, "lr": 0.2932506624401274, "epoch": 0.18737937605355093, "percentage": 9.59, "elapsed_time": "4:01:57", "remaining_time": "1 day, 14:01:46", "throughput": 335.16, "total_tokens": 4865824} {"current_steps": 3840, "total_steps": 40000, "loss": 0.0811, "lr": 0.29323318070892584, "epoch": 0.18762367771724525, "percentage": 9.6, "elapsed_time": "4:02:00", "remaining_time": "1 day, 13:58:58", "throughput": 335.53, "total_tokens": 4872128} {"current_steps": 3845, "total_steps": 40000, "loss": 0.0881, "lr": 0.29321567688936784, "epoch": 0.18786797938093958, "percentage": 9.61, "elapsed_time": "4:02:03", "remaining_time": "1 day, 13:56:10", "throughput": 335.88, "total_tokens": 4878368} {"current_steps": 3850, "total_steps": 40000, "loss": 0.0841, "lr": 0.29319815098415275, "epoch": 0.18811228104463393, "percentage": 9.62, "elapsed_time": "4:02:07", "remaining_time": "1 day, 13:53:23", "throughput": 336.25, "total_tokens": 4884704} {"current_steps": 3855, "total_steps": 40000, "loss": 0.0683, "lr": 0.2931806029959832, "epoch": 0.18835658270832825, "percentage": 9.64, "elapsed_time": "4:02:10", "remaining_time": "1 day, 13:50:35", "throughput": 336.59, "total_tokens": 4890656} {"current_steps": 3860, "total_steps": 40000, "loss": 0.0946, "lr": 0.29316303292756535, "epoch": 0.18860088437202258, "percentage": 9.65, "elapsed_time": "4:02:13", "remaining_time": "1 day, 13:47:48", "throughput": 336.91, "total_tokens": 4896352} {"current_steps": 3865, "total_steps": 40000, "loss": 0.0781, "lr": 0.29314544078160876, "epoch": 0.1888451860357169, "percentage": 9.66, "elapsed_time": "4:02:16", "remaining_time": "1 day, 13:45:02", "throughput": 337.28, "total_tokens": 4902720} {"current_steps": 3870, "total_steps": 40000, "loss": 0.0963, "lr": 0.2931278265608263, "epoch": 0.18908948769941122, "percentage": 9.68, "elapsed_time": "4:02:19", "remaining_time": "1 day, 13:42:16", "throughput": 337.65, "total_tokens": 4909120} {"current_steps": 3875, "total_steps": 40000, "loss": 0.1194, "lr": 0.29311019026793433, "epoch": 0.18933378936310558, "percentage": 9.69, "elapsed_time": "4:02:22", "remaining_time": "1 day, 13:39:31", "throughput": 337.99, "total_tokens": 4915104} {"current_steps": 3880, "total_steps": 40000, "loss": 0.0817, "lr": 0.29309253190565254, "epoch": 0.1895780910267999, "percentage": 9.7, "elapsed_time": "4:02:25", "remaining_time": "1 day, 13:36:46", "throughput": 338.35, "total_tokens": 4921344} {"current_steps": 3885, "total_steps": 40000, "loss": 0.0876, "lr": 0.2930748514767042, "epoch": 0.18982239269049422, "percentage": 9.71, "elapsed_time": "4:02:28", "remaining_time": "1 day, 13:34:02", "throughput": 338.71, "total_tokens": 4927712} {"current_steps": 3890, "total_steps": 40000, "loss": 0.0702, "lr": 0.29305714898381574, "epoch": 0.19006669435418855, "percentage": 9.72, "elapsed_time": "4:02:31", "remaining_time": "1 day, 13:31:18", "throughput": 339.08, "total_tokens": 4934112} {"current_steps": 3895, "total_steps": 40000, "loss": 0.077, "lr": 0.29303942442971714, "epoch": 0.19031099601788287, "percentage": 9.74, "elapsed_time": "4:02:34", "remaining_time": "1 day, 13:28:35", "throughput": 339.45, "total_tokens": 4940512} {"current_steps": 3900, "total_steps": 40000, "loss": 0.066, "lr": 0.2930216778171417, "epoch": 0.19055529768157722, "percentage": 9.75, "elapsed_time": "4:02:37", "remaining_time": "1 day, 13:25:52", "throughput": 339.81, "total_tokens": 4946912} {"current_steps": 3905, "total_steps": 40000, "loss": 0.0668, "lr": 0.2930039091488263, "epoch": 0.19079959934527155, "percentage": 9.76, "elapsed_time": "4:02:40", "remaining_time": "1 day, 13:23:10", "throughput": 340.2, "total_tokens": 4953568} {"current_steps": 3910, "total_steps": 40000, "loss": 0.1146, "lr": 0.29298611842751093, "epoch": 0.19104390100896587, "percentage": 9.78, "elapsed_time": "4:02:43", "remaining_time": "1 day, 13:20:27", "throughput": 340.55, "total_tokens": 4959680} {"current_steps": 3915, "total_steps": 40000, "loss": 0.0835, "lr": 0.29296830565593923, "epoch": 0.1912882026726602, "percentage": 9.79, "elapsed_time": "4:02:46", "remaining_time": "1 day, 13:17:45", "throughput": 340.9, "total_tokens": 4965824} {"current_steps": 3920, "total_steps": 40000, "loss": 0.0788, "lr": 0.2929504708368582, "epoch": 0.19153250433635452, "percentage": 9.8, "elapsed_time": "4:02:50", "remaining_time": "1 day, 13:15:04", "throughput": 341.29, "total_tokens": 4972608} {"current_steps": 3925, "total_steps": 40000, "loss": 0.073, "lr": 0.29293261397301806, "epoch": 0.19177680600004887, "percentage": 9.81, "elapsed_time": "4:02:53", "remaining_time": "1 day, 13:12:22", "throughput": 341.63, "total_tokens": 4978624} {"current_steps": 3930, "total_steps": 40000, "loss": 0.0698, "lr": 0.29291473506717275, "epoch": 0.1920211076637432, "percentage": 9.83, "elapsed_time": "4:02:56", "remaining_time": "1 day, 13:09:42", "throughput": 342.02, "total_tokens": 4985312} {"current_steps": 3935, "total_steps": 40000, "loss": 0.0539, "lr": 0.29289683412207923, "epoch": 0.19226540932743752, "percentage": 9.84, "elapsed_time": "4:02:59", "remaining_time": "1 day, 13:07:01", "throughput": 342.37, "total_tokens": 4991456} {"current_steps": 3940, "total_steps": 40000, "loss": 0.0957, "lr": 0.29287891114049813, "epoch": 0.19250971099113184, "percentage": 9.85, "elapsed_time": "4:03:02", "remaining_time": "1 day, 13:04:22", "throughput": 342.74, "total_tokens": 4997952} {"current_steps": 3945, "total_steps": 40000, "loss": 0.0464, "lr": 0.29286096612519347, "epoch": 0.19275401265482617, "percentage": 9.86, "elapsed_time": "4:03:05", "remaining_time": "1 day, 13:01:42", "throughput": 343.09, "total_tokens": 5004064} {"current_steps": 3950, "total_steps": 40000, "loss": 0.0728, "lr": 0.2928429990789325, "epoch": 0.19299831431852052, "percentage": 9.88, "elapsed_time": "4:03:08", "remaining_time": "1 day, 12:59:04", "throughput": 343.47, "total_tokens": 5010720} {"current_steps": 3955, "total_steps": 40000, "loss": 0.0711, "lr": 0.29282501000448596, "epoch": 0.19324261598221484, "percentage": 9.89, "elapsed_time": "4:03:11", "remaining_time": "1 day, 12:56:25", "throughput": 343.83, "total_tokens": 5017056} {"current_steps": 3960, "total_steps": 40000, "loss": 0.1036, "lr": 0.2928069989046281, "epoch": 0.19348691764590917, "percentage": 9.9, "elapsed_time": "4:03:14", "remaining_time": "1 day, 12:53:47", "throughput": 344.18, "total_tokens": 5023264} {"current_steps": 3965, "total_steps": 40000, "loss": 0.0718, "lr": 0.2927889657821363, "epoch": 0.1937312193096035, "percentage": 9.91, "elapsed_time": "4:03:17", "remaining_time": "1 day, 12:51:09", "throughput": 344.54, "total_tokens": 5029568} {"current_steps": 3970, "total_steps": 40000, "loss": 0.0909, "lr": 0.2927709106397916, "epoch": 0.19397552097329782, "percentage": 9.93, "elapsed_time": "4:03:20", "remaining_time": "1 day, 12:48:32", "throughput": 344.93, "total_tokens": 5036288} {"current_steps": 3975, "total_steps": 40000, "loss": 0.0575, "lr": 0.29275283348037834, "epoch": 0.19421982263699217, "percentage": 9.94, "elapsed_time": "4:03:24", "remaining_time": "1 day, 12:45:54", "throughput": 345.26, "total_tokens": 5042144} {"current_steps": 3980, "total_steps": 40000, "loss": 0.0732, "lr": 0.29273473430668423, "epoch": 0.1944641243006865, "percentage": 9.95, "elapsed_time": "4:03:27", "remaining_time": "1 day, 12:43:17", "throughput": 345.61, "total_tokens": 5048384} {"current_steps": 3985, "total_steps": 40000, "loss": 0.0661, "lr": 0.2927166131215003, "epoch": 0.19470842596438082, "percentage": 9.96, "elapsed_time": "4:03:30", "remaining_time": "1 day, 12:40:41", "throughput": 345.96, "total_tokens": 5054592} {"current_steps": 3990, "total_steps": 40000, "loss": 0.0561, "lr": 0.2926984699276212, "epoch": 0.19495272762807514, "percentage": 9.98, "elapsed_time": "4:03:33", "remaining_time": "1 day, 12:38:04", "throughput": 346.32, "total_tokens": 5060768} {"current_steps": 3995, "total_steps": 40000, "loss": 0.0701, "lr": 0.29268030472784473, "epoch": 0.19519702929176946, "percentage": 9.99, "elapsed_time": "4:03:36", "remaining_time": "1 day, 12:35:29", "throughput": 346.68, "total_tokens": 5067200} {"current_steps": 4000, "total_steps": 40000, "loss": 0.0908, "lr": 0.2926621175249723, "epoch": 0.19544133095546382, "percentage": 10.0, "elapsed_time": "4:03:39", "remaining_time": "1 day, 12:32:53", "throughput": 347.02, "total_tokens": 5073216} {"current_steps": 4000, "total_steps": 40000, "eval_loss": 0.08182398229837418, "epoch": 0.19544133095546382, "percentage": 10.0, "elapsed_time": "4:14:19", "remaining_time": "1 day, 14:08:52", "throughput": 332.47, "total_tokens": 5073216} {"current_steps": 4005, "total_steps": 40000, "loss": 0.1028, "lr": 0.29264390832180853, "epoch": 0.19568563261915814, "percentage": 10.01, "elapsed_time": "4:14:22", "remaining_time": "1 day, 14:06:15", "throughput": 332.79, "total_tokens": 5079360} {"current_steps": 4010, "total_steps": 40000, "loss": 0.0697, "lr": 0.29262567712116144, "epoch": 0.19592993428285246, "percentage": 10.03, "elapsed_time": "4:14:25", "remaining_time": "1 day, 14:03:32", "throughput": 333.12, "total_tokens": 5085344} {"current_steps": 4015, "total_steps": 40000, "loss": 0.0583, "lr": 0.29260742392584266, "epoch": 0.1961742359465468, "percentage": 10.04, "elapsed_time": "4:14:29", "remaining_time": "1 day, 14:00:51", "throughput": 333.49, "total_tokens": 5092160} {"current_steps": 4020, "total_steps": 40000, "loss": 0.0756, "lr": 0.292589148738667, "epoch": 0.19641853761024114, "percentage": 10.05, "elapsed_time": "4:14:32", "remaining_time": "1 day, 13:58:10", "throughput": 333.83, "total_tokens": 5098400} {"current_steps": 4025, "total_steps": 40000, "loss": 0.0663, "lr": 0.2925708515624527, "epoch": 0.19666283927393546, "percentage": 10.06, "elapsed_time": "4:14:35", "remaining_time": "1 day, 13:55:30", "throughput": 334.21, "total_tokens": 5105184} {"current_steps": 4030, "total_steps": 40000, "loss": 0.045, "lr": 0.29255253240002144, "epoch": 0.1969071409376298, "percentage": 10.08, "elapsed_time": "4:14:38", "remaining_time": "1 day, 13:52:50", "throughput": 334.59, "total_tokens": 5112064} {"current_steps": 4035, "total_steps": 40000, "loss": 0.053, "lr": 0.2925341912541983, "epoch": 0.1971514426013241, "percentage": 10.09, "elapsed_time": "4:14:41", "remaining_time": "1 day, 13:50:09", "throughput": 334.92, "total_tokens": 5118080} {"current_steps": 4040, "total_steps": 40000, "loss": 0.1025, "lr": 0.2925158281278116, "epoch": 0.19739574426501844, "percentage": 10.1, "elapsed_time": "4:14:44", "remaining_time": "1 day, 13:47:29", "throughput": 335.25, "total_tokens": 5124192} {"current_steps": 4045, "total_steps": 40000, "loss": 0.0568, "lr": 0.29249744302369324, "epoch": 0.1976400459287128, "percentage": 10.11, "elapsed_time": "4:14:47", "remaining_time": "1 day, 13:44:49", "throughput": 335.57, "total_tokens": 5130176} {"current_steps": 4050, "total_steps": 40000, "loss": 0.059, "lr": 0.29247903594467844, "epoch": 0.1978843475924071, "percentage": 10.12, "elapsed_time": "4:14:50", "remaining_time": "1 day, 13:42:10", "throughput": 335.95, "total_tokens": 5136992} {"current_steps": 4055, "total_steps": 40000, "loss": 0.0824, "lr": 0.2924606068936058, "epoch": 0.19812864925610144, "percentage": 10.14, "elapsed_time": "4:14:54", "remaining_time": "1 day, 13:39:31", "throughput": 336.32, "total_tokens": 5143680} {"current_steps": 4060, "total_steps": 40000, "loss": 0.0654, "lr": 0.2924421558733173, "epoch": 0.19837295091979576, "percentage": 10.15, "elapsed_time": "4:14:57", "remaining_time": "1 day, 13:36:52", "throughput": 336.66, "total_tokens": 5149856} {"current_steps": 4065, "total_steps": 40000, "loss": 0.0995, "lr": 0.2924236828866583, "epoch": 0.19861725258349008, "percentage": 10.16, "elapsed_time": "4:15:00", "remaining_time": "1 day, 13:34:15", "throughput": 337.0, "total_tokens": 5156192} {"current_steps": 4070, "total_steps": 40000, "loss": 0.076, "lr": 0.29240518793647763, "epoch": 0.19886155424718444, "percentage": 10.17, "elapsed_time": "4:15:03", "remaining_time": "1 day, 13:31:37", "throughput": 337.34, "total_tokens": 5162464} {"current_steps": 4075, "total_steps": 40000, "loss": 0.0643, "lr": 0.29238667102562743, "epoch": 0.19910585591087876, "percentage": 10.19, "elapsed_time": "4:15:06", "remaining_time": "1 day, 13:28:59", "throughput": 337.68, "total_tokens": 5168576} {"current_steps": 4080, "total_steps": 40000, "loss": 0.0607, "lr": 0.29236813215696317, "epoch": 0.19935015757457308, "percentage": 10.2, "elapsed_time": "4:15:09", "remaining_time": "1 day, 13:26:22", "throughput": 338.01, "total_tokens": 5174656} {"current_steps": 4085, "total_steps": 40000, "loss": 0.0647, "lr": 0.2923495713333439, "epoch": 0.1995944592382674, "percentage": 10.21, "elapsed_time": "4:15:12", "remaining_time": "1 day, 13:23:45", "throughput": 338.35, "total_tokens": 5180960} {"current_steps": 4090, "total_steps": 40000, "loss": 0.0557, "lr": 0.29233098855763173, "epoch": 0.19983876090196173, "percentage": 10.22, "elapsed_time": "4:15:15", "remaining_time": "1 day, 13:21:09", "throughput": 338.71, "total_tokens": 5187520} {"current_steps": 4095, "total_steps": 40000, "loss": 0.0687, "lr": 0.29231238383269254, "epoch": 0.20008306256565608, "percentage": 10.24, "elapsed_time": "4:15:18", "remaining_time": "1 day, 13:18:33", "throughput": 339.04, "total_tokens": 5193632} {"current_steps": 4100, "total_steps": 40000, "loss": 0.0615, "lr": 0.2922937571613954, "epoch": 0.2003273642293504, "percentage": 10.25, "elapsed_time": "4:15:21", "remaining_time": "1 day, 13:15:56", "throughput": 339.35, "total_tokens": 5199328} {"current_steps": 4105, "total_steps": 40000, "loss": 0.0855, "lr": 0.29227510854661265, "epoch": 0.20057166589304473, "percentage": 10.26, "elapsed_time": "4:15:24", "remaining_time": "1 day, 13:13:22", "throughput": 339.71, "total_tokens": 5205920} {"current_steps": 4110, "total_steps": 40000, "loss": 0.0815, "lr": 0.29225643799122025, "epoch": 0.20081596755673906, "percentage": 10.27, "elapsed_time": "4:15:27", "remaining_time": "1 day, 13:10:47", "throughput": 340.07, "total_tokens": 5212480} {"current_steps": 4115, "total_steps": 40000, "loss": 0.0721, "lr": 0.2922377454980974, "epoch": 0.20106026922043338, "percentage": 10.29, "elapsed_time": "4:15:30", "remaining_time": "1 day, 13:08:12", "throughput": 340.41, "total_tokens": 5218752} {"current_steps": 4120, "total_steps": 40000, "loss": 0.0909, "lr": 0.29221903107012676, "epoch": 0.20130457088412773, "percentage": 10.3, "elapsed_time": "4:15:33", "remaining_time": "1 day, 13:05:38", "throughput": 340.74, "total_tokens": 5224896} {"current_steps": 4125, "total_steps": 40000, "loss": 0.0936, "lr": 0.29220029471019426, "epoch": 0.20154887254782206, "percentage": 10.31, "elapsed_time": "4:15:37", "remaining_time": "1 day, 13:03:06", "throughput": 341.12, "total_tokens": 5231744} {"current_steps": 4130, "total_steps": 40000, "loss": 0.091, "lr": 0.2921815364211893, "epoch": 0.20179317421151638, "percentage": 10.32, "elapsed_time": "4:15:40", "remaining_time": "1 day, 13:00:33", "throughput": 341.47, "total_tokens": 5238144} {"current_steps": 4135, "total_steps": 40000, "loss": 0.0774, "lr": 0.29216275620600474, "epoch": 0.2020374758752107, "percentage": 10.34, "elapsed_time": "4:15:43", "remaining_time": "1 day, 12:58:00", "throughput": 341.82, "total_tokens": 5244608} {"current_steps": 4140, "total_steps": 40000, "loss": 0.0782, "lr": 0.29214395406753657, "epoch": 0.20228177753890503, "percentage": 10.35, "elapsed_time": "4:15:46", "remaining_time": "1 day, 12:55:27", "throughput": 342.16, "total_tokens": 5250912} {"current_steps": 4145, "total_steps": 40000, "loss": 0.0558, "lr": 0.2921251300086844, "epoch": 0.20252607920259938, "percentage": 10.36, "elapsed_time": "4:15:49", "remaining_time": "1 day, 12:52:55", "throughput": 342.52, "total_tokens": 5257536} {"current_steps": 4150, "total_steps": 40000, "loss": 0.0829, "lr": 0.2921062840323511, "epoch": 0.2027703808662937, "percentage": 10.38, "elapsed_time": "4:15:52", "remaining_time": "1 day, 12:50:24", "throughput": 342.88, "total_tokens": 5264160} {"current_steps": 4155, "total_steps": 40000, "loss": 0.0836, "lr": 0.29208741614144307, "epoch": 0.20301468252998803, "percentage": 10.39, "elapsed_time": "4:15:55", "remaining_time": "1 day, 12:47:52", "throughput": 343.22, "total_tokens": 5270432} {"current_steps": 4160, "total_steps": 40000, "loss": 0.0403, "lr": 0.2920685263388698, "epoch": 0.20325898419368235, "percentage": 10.4, "elapsed_time": "4:15:58", "remaining_time": "1 day, 12:45:21", "throughput": 343.55, "total_tokens": 5276544} {"current_steps": 4165, "total_steps": 40000, "loss": 0.0905, "lr": 0.2920496146275445, "epoch": 0.20350328585737668, "percentage": 10.41, "elapsed_time": "4:16:01", "remaining_time": "1 day, 12:42:50", "throughput": 343.89, "total_tokens": 5282816} {"current_steps": 4170, "total_steps": 40000, "loss": 0.0726, "lr": 0.29203068101038343, "epoch": 0.20374758752107103, "percentage": 10.42, "elapsed_time": "4:16:04", "remaining_time": "1 day, 12:40:20", "throughput": 344.22, "total_tokens": 5288960} {"current_steps": 4175, "total_steps": 40000, "loss": 0.1006, "lr": 0.2920117254903065, "epoch": 0.20399188918476535, "percentage": 10.44, "elapsed_time": "4:16:08", "remaining_time": "1 day, 12:37:50", "throughput": 344.57, "total_tokens": 5295392} {"current_steps": 4180, "total_steps": 40000, "loss": 0.0661, "lr": 0.29199274807023695, "epoch": 0.20423619084845968, "percentage": 10.45, "elapsed_time": "4:16:11", "remaining_time": "1 day, 12:35:20", "throughput": 344.91, "total_tokens": 5301600} {"current_steps": 4185, "total_steps": 40000, "loss": 0.0688, "lr": 0.29197374875310117, "epoch": 0.204480492512154, "percentage": 10.46, "elapsed_time": "4:16:14", "remaining_time": "1 day, 12:32:51", "throughput": 345.27, "total_tokens": 5308256} {"current_steps": 4190, "total_steps": 40000, "loss": 0.1124, "lr": 0.2919547275418292, "epoch": 0.20472479417584835, "percentage": 10.47, "elapsed_time": "4:16:17", "remaining_time": "1 day, 12:30:22", "throughput": 345.61, "total_tokens": 5314592} {"current_steps": 4195, "total_steps": 40000, "loss": 0.0832, "lr": 0.29193568443935436, "epoch": 0.20496909583954268, "percentage": 10.49, "elapsed_time": "4:16:20", "remaining_time": "1 day, 12:27:53", "throughput": 345.96, "total_tokens": 5321024} {"current_steps": 4200, "total_steps": 40000, "loss": 0.0807, "lr": 0.2919166194486133, "epoch": 0.205213397503237, "percentage": 10.5, "elapsed_time": "4:16:23", "remaining_time": "1 day, 12:25:26", "throughput": 346.32, "total_tokens": 5327680} {"current_steps": 4200, "total_steps": 40000, "eval_loss": 0.0783008560538292, "epoch": 0.205213397503237, "percentage": 10.5, "elapsed_time": "4:27:02", "remaining_time": "1 day, 13:56:16", "throughput": 332.5, "total_tokens": 5327680} {"current_steps": 4205, "total_steps": 40000, "loss": 0.1067, "lr": 0.2918975325725461, "epoch": 0.20545769916693132, "percentage": 10.51, "elapsed_time": "4:27:06", "remaining_time": "1 day, 13:53:47", "throughput": 332.83, "total_tokens": 5334240} {"current_steps": 4210, "total_steps": 40000, "loss": 0.0772, "lr": 0.29187842381409607, "epoch": 0.20570200083062565, "percentage": 10.53, "elapsed_time": "4:27:09", "remaining_time": "1 day, 13:51:12", "throughput": 333.15, "total_tokens": 5340416} {"current_steps": 4215, "total_steps": 40000, "loss": 0.0722, "lr": 0.29185929317621023, "epoch": 0.20594630249432, "percentage": 10.54, "elapsed_time": "4:27:12", "remaining_time": "1 day, 13:48:38", "throughput": 333.52, "total_tokens": 5347328} {"current_steps": 4220, "total_steps": 40000, "loss": 0.0735, "lr": 0.29184014066183867, "epoch": 0.20619060415801432, "percentage": 10.55, "elapsed_time": "4:27:16", "remaining_time": "1 day, 13:46:04", "throughput": 333.85, "total_tokens": 5353600} {"current_steps": 4225, "total_steps": 40000, "loss": 0.0505, "lr": 0.2918209662739349, "epoch": 0.20643490582170865, "percentage": 10.56, "elapsed_time": "4:27:19", "remaining_time": "1 day, 13:43:30", "throughput": 334.18, "total_tokens": 5359936} {"current_steps": 4230, "total_steps": 40000, "loss": 0.089, "lr": 0.29180177001545593, "epoch": 0.20667920748540297, "percentage": 10.57, "elapsed_time": "4:27:22", "remaining_time": "1 day, 13:40:58", "throughput": 334.52, "total_tokens": 5366560} {"current_steps": 4235, "total_steps": 40000, "loss": 0.1032, "lr": 0.29178255188936203, "epoch": 0.2069235091490973, "percentage": 10.59, "elapsed_time": "4:27:25", "remaining_time": "1 day, 13:38:24", "throughput": 334.84, "total_tokens": 5372640} {"current_steps": 4240, "total_steps": 40000, "loss": 0.0568, "lr": 0.2917633118986169, "epoch": 0.20716781081279165, "percentage": 10.6, "elapsed_time": "4:27:28", "remaining_time": "1 day, 13:35:52", "throughput": 335.19, "total_tokens": 5379328} {"current_steps": 4245, "total_steps": 40000, "loss": 0.1136, "lr": 0.2917440500461875, "epoch": 0.20741211247648597, "percentage": 10.61, "elapsed_time": "4:27:31", "remaining_time": "1 day, 13:33:22", "throughput": 335.6, "total_tokens": 5386944} {"current_steps": 4250, "total_steps": 40000, "loss": 0.0795, "lr": 0.29172476633504435, "epoch": 0.2076564141401803, "percentage": 10.62, "elapsed_time": "4:27:34", "remaining_time": "1 day, 13:30:49", "throughput": 335.92, "total_tokens": 5393120} {"current_steps": 4255, "total_steps": 40000, "loss": 0.0772, "lr": 0.2917054607681612, "epoch": 0.20790071580387462, "percentage": 10.64, "elapsed_time": "4:27:37", "remaining_time": "1 day, 13:28:17", "throughput": 336.22, "total_tokens": 5399040} {"current_steps": 4260, "total_steps": 40000, "loss": 0.069, "lr": 0.29168613334851523, "epoch": 0.20814501746756894, "percentage": 10.65, "elapsed_time": "4:27:40", "remaining_time": "1 day, 13:25:45", "throughput": 336.54, "total_tokens": 5405184} {"current_steps": 4265, "total_steps": 40000, "loss": 0.0773, "lr": 0.2916667840790869, "epoch": 0.2083893191312633, "percentage": 10.66, "elapsed_time": "4:27:44", "remaining_time": "1 day, 13:23:14", "throughput": 336.88, "total_tokens": 5411680} {"current_steps": 4270, "total_steps": 40000, "loss": 0.0777, "lr": 0.2916474129628603, "epoch": 0.20863362079495762, "percentage": 10.67, "elapsed_time": "4:27:47", "remaining_time": "1 day, 13:20:43", "throughput": 337.2, "total_tokens": 5417888} {"current_steps": 4275, "total_steps": 40000, "loss": 0.074, "lr": 0.29162802000282245, "epoch": 0.20887792245865194, "percentage": 10.69, "elapsed_time": "4:27:50", "remaining_time": "1 day, 13:18:13", "throughput": 337.53, "total_tokens": 5424160} {"current_steps": 4280, "total_steps": 40000, "loss": 0.063, "lr": 0.2916086052019642, "epoch": 0.20912222412234627, "percentage": 10.7, "elapsed_time": "4:27:53", "remaining_time": "1 day, 13:15:43", "throughput": 337.86, "total_tokens": 5430464} {"current_steps": 4285, "total_steps": 40000, "loss": 0.0755, "lr": 0.2915891685632794, "epoch": 0.2093665257860406, "percentage": 10.71, "elapsed_time": "4:27:56", "remaining_time": "1 day, 13:13:13", "throughput": 338.19, "total_tokens": 5436800} {"current_steps": 4290, "total_steps": 40000, "loss": 0.0759, "lr": 0.29156971008976545, "epoch": 0.20961082744973494, "percentage": 10.72, "elapsed_time": "4:27:59", "remaining_time": "1 day, 13:10:44", "throughput": 338.53, "total_tokens": 5443392} {"current_steps": 4295, "total_steps": 40000, "loss": 0.0551, "lr": 0.2915502297844232, "epoch": 0.20985512911342927, "percentage": 10.74, "elapsed_time": "4:28:02", "remaining_time": "1 day, 13:08:16", "throughput": 338.87, "total_tokens": 5449920} {"current_steps": 4300, "total_steps": 40000, "loss": 0.0844, "lr": 0.2915307276502566, "epoch": 0.2100994307771236, "percentage": 10.75, "elapsed_time": "4:28:05", "remaining_time": "1 day, 13:05:47", "throughput": 339.19, "total_tokens": 5456064} {"current_steps": 4305, "total_steps": 40000, "loss": 0.0799, "lr": 0.29151120369027334, "epoch": 0.21034373244081792, "percentage": 10.76, "elapsed_time": "4:28:08", "remaining_time": "1 day, 13:03:19", "throughput": 339.53, "total_tokens": 5462592} {"current_steps": 4310, "total_steps": 40000, "loss": 0.082, "lr": 0.29149165790748405, "epoch": 0.21058803410451224, "percentage": 10.78, "elapsed_time": "4:28:11", "remaining_time": "1 day, 13:00:51", "throughput": 339.87, "total_tokens": 5469088} {"current_steps": 4315, "total_steps": 40000, "loss": 0.078, "lr": 0.291472090304903, "epoch": 0.2108323357682066, "percentage": 10.79, "elapsed_time": "4:28:14", "remaining_time": "1 day, 12:58:24", "throughput": 340.2, "total_tokens": 5475456} {"current_steps": 4320, "total_steps": 40000, "loss": 0.0875, "lr": 0.2914525008855478, "epoch": 0.21107663743190092, "percentage": 10.8, "elapsed_time": "4:28:17", "remaining_time": "1 day, 12:55:57", "throughput": 340.54, "total_tokens": 5481952} {"current_steps": 4325, "total_steps": 40000, "loss": 0.1228, "lr": 0.2914328896524394, "epoch": 0.21132093909559524, "percentage": 10.81, "elapsed_time": "4:28:21", "remaining_time": "1 day, 12:53:30", "throughput": 340.87, "total_tokens": 5488320} {"current_steps": 4330, "total_steps": 40000, "loss": 0.0691, "lr": 0.291413256608602, "epoch": 0.21156524075928956, "percentage": 10.82, "elapsed_time": "4:28:24", "remaining_time": "1 day, 12:51:04", "throughput": 341.21, "total_tokens": 5494912} {"current_steps": 4335, "total_steps": 40000, "loss": 0.0882, "lr": 0.29139360175706336, "epoch": 0.2118095424229839, "percentage": 10.84, "elapsed_time": "4:28:27", "remaining_time": "1 day, 12:48:38", "throughput": 341.53, "total_tokens": 5501152} {"current_steps": 4340, "total_steps": 40000, "loss": 0.1074, "lr": 0.2913739251008544, "epoch": 0.21205384408667824, "percentage": 10.85, "elapsed_time": "4:28:30", "remaining_time": "1 day, 12:46:12", "throughput": 341.84, "total_tokens": 5507200} {"current_steps": 4345, "total_steps": 40000, "loss": 0.1126, "lr": 0.29135422664300964, "epoch": 0.21229814575037256, "percentage": 10.86, "elapsed_time": "4:28:33", "remaining_time": "1 day, 12:43:46", "throughput": 342.16, "total_tokens": 5513376} {"current_steps": 4350, "total_steps": 40000, "loss": 0.0902, "lr": 0.29133450638656677, "epoch": 0.2125424474140669, "percentage": 10.88, "elapsed_time": "4:28:36", "remaining_time": "1 day, 12:41:21", "throughput": 342.48, "total_tokens": 5519616} {"current_steps": 4355, "total_steps": 40000, "loss": 0.102, "lr": 0.2913147643345669, "epoch": 0.2127867490777612, "percentage": 10.89, "elapsed_time": "4:28:39", "remaining_time": "1 day, 12:38:55", "throughput": 342.79, "total_tokens": 5525600} {"current_steps": 4360, "total_steps": 40000, "loss": 0.073, "lr": 0.29129500049005447, "epoch": 0.21303105074145554, "percentage": 10.9, "elapsed_time": "4:28:42", "remaining_time": "1 day, 12:36:31", "throughput": 343.11, "total_tokens": 5531904} {"current_steps": 4365, "total_steps": 40000, "loss": 0.0772, "lr": 0.2912752148560773, "epoch": 0.2132753524051499, "percentage": 10.91, "elapsed_time": "4:28:45", "remaining_time": "1 day, 12:34:06", "throughput": 343.42, "total_tokens": 5537888} {"current_steps": 4370, "total_steps": 40000, "loss": 0.0776, "lr": 0.2912554074356866, "epoch": 0.2135196540688442, "percentage": 10.93, "elapsed_time": "4:28:48", "remaining_time": "1 day, 12:31:42", "throughput": 343.75, "total_tokens": 5544320} {"current_steps": 4375, "total_steps": 40000, "loss": 0.0901, "lr": 0.2912355782319371, "epoch": 0.21376395573253854, "percentage": 10.94, "elapsed_time": "4:28:51", "remaining_time": "1 day, 12:29:19", "throughput": 344.08, "total_tokens": 5550688} {"current_steps": 4380, "total_steps": 40000, "loss": 0.0814, "lr": 0.2912157272478864, "epoch": 0.21400825739623286, "percentage": 10.95, "elapsed_time": "4:28:54", "remaining_time": "1 day, 12:26:55", "throughput": 344.38, "total_tokens": 5556544} {"current_steps": 4385, "total_steps": 40000, "loss": 0.0841, "lr": 0.291195854486596, "epoch": 0.2142525590599272, "percentage": 10.96, "elapsed_time": "4:28:57", "remaining_time": "1 day, 12:24:32", "throughput": 344.71, "total_tokens": 5562912} {"current_steps": 4390, "total_steps": 40000, "loss": 0.0709, "lr": 0.2911759599511305, "epoch": 0.21449686072362154, "percentage": 10.97, "elapsed_time": "4:29:00", "remaining_time": "1 day, 12:22:08", "throughput": 345.02, "total_tokens": 5568928} {"current_steps": 4395, "total_steps": 40000, "loss": 0.0439, "lr": 0.29115604364455777, "epoch": 0.21474116238731586, "percentage": 10.99, "elapsed_time": "4:29:04", "remaining_time": "1 day, 12:19:46", "throughput": 345.36, "total_tokens": 5575520} {"current_steps": 4400, "total_steps": 40000, "loss": 0.0782, "lr": 0.2911361055699493, "epoch": 0.21498546405101018, "percentage": 11.0, "elapsed_time": "4:29:07", "remaining_time": "1 day, 12:17:25", "throughput": 345.71, "total_tokens": 5582272} {"current_steps": 4400, "total_steps": 40000, "eval_loss": 0.08176326751708984, "epoch": 0.21498546405101018, "percentage": 11.0, "elapsed_time": "4:39:46", "remaining_time": "1 day, 13:43:37", "throughput": 332.55, "total_tokens": 5582272} {"current_steps": 4405, "total_steps": 40000, "loss": 0.0704, "lr": 0.2911161457303797, "epoch": 0.2152297657147045, "percentage": 11.01, "elapsed_time": "4:39:50", "remaining_time": "1 day, 13:41:14", "throughput": 332.84, "total_tokens": 5588480} {"current_steps": 4410, "total_steps": 40000, "loss": 0.101, "lr": 0.291096164128927, "epoch": 0.21547406737839886, "percentage": 11.03, "elapsed_time": "4:39:53", "remaining_time": "1 day, 13:38:47", "throughput": 333.16, "total_tokens": 5594784} {"current_steps": 4415, "total_steps": 40000, "loss": 0.0513, "lr": 0.2910761607686727, "epoch": 0.21571836904209318, "percentage": 11.04, "elapsed_time": "4:39:56", "remaining_time": "1 day, 13:36:19", "throughput": 333.46, "total_tokens": 5600992} {"current_steps": 4420, "total_steps": 40000, "loss": 0.0807, "lr": 0.2910561356527016, "epoch": 0.2159626707057875, "percentage": 11.05, "elapsed_time": "4:39:59", "remaining_time": "1 day, 13:33:52", "throughput": 333.79, "total_tokens": 5607456} {"current_steps": 4425, "total_steps": 40000, "loss": 0.0808, "lr": 0.2910360887841017, "epoch": 0.21620697236948183, "percentage": 11.06, "elapsed_time": "4:40:02", "remaining_time": "1 day, 13:31:26", "throughput": 334.1, "total_tokens": 5613760} {"current_steps": 4430, "total_steps": 40000, "loss": 0.0858, "lr": 0.2910160201659645, "epoch": 0.21645127403317616, "percentage": 11.07, "elapsed_time": "4:40:05", "remaining_time": "1 day, 13:28:59", "throughput": 334.42, "total_tokens": 5620256} {"current_steps": 4435, "total_steps": 40000, "loss": 0.084, "lr": 0.29099592980138494, "epoch": 0.2166955756968705, "percentage": 11.09, "elapsed_time": "4:40:08", "remaining_time": "1 day, 13:26:33", "throughput": 334.73, "total_tokens": 5626464} {"current_steps": 4440, "total_steps": 40000, "loss": 0.0815, "lr": 0.29097581769346115, "epoch": 0.21693987736056483, "percentage": 11.1, "elapsed_time": "4:40:11", "remaining_time": "1 day, 13:24:06", "throughput": 335.03, "total_tokens": 5632512} {"current_steps": 4445, "total_steps": 40000, "loss": 0.071, "lr": 0.29095568384529463, "epoch": 0.21718417902425916, "percentage": 11.11, "elapsed_time": "4:40:15", "remaining_time": "1 day, 13:21:41", "throughput": 335.39, "total_tokens": 5639552} {"current_steps": 4450, "total_steps": 40000, "loss": 0.0907, "lr": 0.2909355282599903, "epoch": 0.21742848068795348, "percentage": 11.12, "elapsed_time": "4:40:18", "remaining_time": "1 day, 13:19:15", "throughput": 335.69, "total_tokens": 5645600} {"current_steps": 4455, "total_steps": 40000, "loss": 0.0716, "lr": 0.29091535094065635, "epoch": 0.2176727823516478, "percentage": 11.14, "elapsed_time": "4:40:21", "remaining_time": "1 day, 13:16:50", "throughput": 335.99, "total_tokens": 5651648} {"current_steps": 4460, "total_steps": 40000, "loss": 0.0623, "lr": 0.2908951518904045, "epoch": 0.21791708401534216, "percentage": 11.15, "elapsed_time": "4:40:24", "remaining_time": "1 day, 13:14:24", "throughput": 336.28, "total_tokens": 5657600} {"current_steps": 4465, "total_steps": 40000, "loss": 0.0767, "lr": 0.29087493111234963, "epoch": 0.21816138567903648, "percentage": 11.16, "elapsed_time": "4:40:27", "remaining_time": "1 day, 13:12:00", "throughput": 336.6, "total_tokens": 5663968} {"current_steps": 4470, "total_steps": 40000, "loss": 0.0777, "lr": 0.29085468860961, "epoch": 0.2184056873427308, "percentage": 11.18, "elapsed_time": "4:40:30", "remaining_time": "1 day, 13:09:35", "throughput": 336.89, "total_tokens": 5669888} {"current_steps": 4475, "total_steps": 40000, "loss": 0.0909, "lr": 0.2908344243853073, "epoch": 0.21864998900642513, "percentage": 11.19, "elapsed_time": "4:40:33", "remaining_time": "1 day, 13:07:11", "throughput": 337.2, "total_tokens": 5676160} {"current_steps": 4480, "total_steps": 40000, "loss": 0.0799, "lr": 0.2908141384425666, "epoch": 0.21889429067011945, "percentage": 11.2, "elapsed_time": "4:40:36", "remaining_time": "1 day, 13:04:48", "throughput": 337.51, "total_tokens": 5682432} {"current_steps": 4485, "total_steps": 40000, "loss": 0.0768, "lr": 0.2907938307845161, "epoch": 0.2191385923338138, "percentage": 11.21, "elapsed_time": "4:40:39", "remaining_time": "1 day, 13:02:25", "throughput": 337.83, "total_tokens": 5688960} {"current_steps": 4490, "total_steps": 40000, "loss": 0.1004, "lr": 0.2907735014142876, "epoch": 0.21938289399750813, "percentage": 11.22, "elapsed_time": "4:40:42", "remaining_time": "1 day, 13:00:03", "throughput": 338.17, "total_tokens": 5695648} {"current_steps": 4495, "total_steps": 40000, "loss": 0.0569, "lr": 0.2907531503350161, "epoch": 0.21962719566120245, "percentage": 11.24, "elapsed_time": "4:40:45", "remaining_time": "1 day, 12:57:39", "throughput": 338.46, "total_tokens": 5701632} {"current_steps": 4500, "total_steps": 40000, "loss": 0.0664, "lr": 0.29073277754983995, "epoch": 0.21987149732489678, "percentage": 11.25, "elapsed_time": "4:40:48", "remaining_time": "1 day, 12:55:17", "throughput": 338.76, "total_tokens": 5707648} {"current_steps": 4505, "total_steps": 40000, "loss": 0.0833, "lr": 0.290712383061901, "epoch": 0.2201157989885911, "percentage": 11.26, "elapsed_time": "4:40:51", "remaining_time": "1 day, 12:52:55", "throughput": 339.06, "total_tokens": 5713824} {"current_steps": 4510, "total_steps": 40000, "loss": 0.0942, "lr": 0.2906919668743443, "epoch": 0.22036010065228545, "percentage": 11.28, "elapsed_time": "4:40:54", "remaining_time": "1 day, 12:50:32", "throughput": 339.35, "total_tokens": 5719680} {"current_steps": 4515, "total_steps": 40000, "loss": 0.0807, "lr": 0.29067152899031823, "epoch": 0.22060440231597978, "percentage": 11.29, "elapsed_time": "4:40:57", "remaining_time": "1 day, 12:48:11", "throughput": 339.64, "total_tokens": 5725504} {"current_steps": 4520, "total_steps": 40000, "loss": 0.0546, "lr": 0.2906510694129746, "epoch": 0.2208487039796741, "percentage": 11.3, "elapsed_time": "4:41:00", "remaining_time": "1 day, 12:45:50", "throughput": 339.94, "total_tokens": 5731712} {"current_steps": 4525, "total_steps": 40000, "loss": 0.0522, "lr": 0.2906305881454685, "epoch": 0.22109300564336842, "percentage": 11.31, "elapsed_time": "4:41:03", "remaining_time": "1 day, 12:43:29", "throughput": 340.27, "total_tokens": 5738240} {"current_steps": 4530, "total_steps": 40000, "loss": 0.0695, "lr": 0.2906100851909585, "epoch": 0.22133730730706275, "percentage": 11.33, "elapsed_time": "4:41:07", "remaining_time": "1 day, 12:41:09", "throughput": 340.57, "total_tokens": 5744384} {"current_steps": 4535, "total_steps": 40000, "loss": 0.0542, "lr": 0.29058956055260626, "epoch": 0.2215816089707571, "percentage": 11.34, "elapsed_time": "4:41:10", "remaining_time": "1 day, 12:38:48", "throughput": 340.88, "total_tokens": 5750752} {"current_steps": 4540, "total_steps": 40000, "loss": 0.0751, "lr": 0.2905690142335771, "epoch": 0.22182591063445142, "percentage": 11.35, "elapsed_time": "4:41:13", "remaining_time": "1 day, 12:36:29", "throughput": 341.22, "total_tokens": 5757568} {"current_steps": 4545, "total_steps": 40000, "loss": 0.0809, "lr": 0.29054844623703946, "epoch": 0.22207021229814575, "percentage": 11.36, "elapsed_time": "4:41:16", "remaining_time": "1 day, 12:34:10", "throughput": 341.53, "total_tokens": 5763744} {"current_steps": 4550, "total_steps": 40000, "loss": 0.0835, "lr": 0.2905278565661651, "epoch": 0.22231451396184007, "percentage": 11.38, "elapsed_time": "4:41:19", "remaining_time": "1 day, 12:31:51", "throughput": 341.86, "total_tokens": 5770464} {"current_steps": 4555, "total_steps": 40000, "loss": 0.0637, "lr": 0.2905072452241293, "epoch": 0.22255881562553442, "percentage": 11.39, "elapsed_time": "4:41:22", "remaining_time": "1 day, 12:29:32", "throughput": 342.17, "total_tokens": 5776704} {"current_steps": 4560, "total_steps": 40000, "loss": 0.0938, "lr": 0.2904866122141106, "epoch": 0.22280311728922875, "percentage": 11.4, "elapsed_time": "4:41:25", "remaining_time": "1 day, 12:27:13", "throughput": 342.47, "total_tokens": 5782848} {"current_steps": 4565, "total_steps": 40000, "loss": 0.0666, "lr": 0.2904659575392908, "epoch": 0.22304741895292307, "percentage": 11.41, "elapsed_time": "4:41:28", "remaining_time": "1 day, 12:24:54", "throughput": 342.77, "total_tokens": 5788960} {"current_steps": 4570, "total_steps": 40000, "loss": 0.0686, "lr": 0.2904452812028551, "epoch": 0.2232917206166174, "percentage": 11.43, "elapsed_time": "4:41:31", "remaining_time": "1 day, 12:22:36", "throughput": 343.07, "total_tokens": 5795104} {"current_steps": 4575, "total_steps": 40000, "loss": 0.1073, "lr": 0.2904245832079922, "epoch": 0.22353602228031172, "percentage": 11.44, "elapsed_time": "4:41:34", "remaining_time": "1 day, 12:20:19", "throughput": 343.39, "total_tokens": 5801536} {"current_steps": 4580, "total_steps": 40000, "loss": 0.0878, "lr": 0.29040386355789377, "epoch": 0.22378032394400607, "percentage": 11.45, "elapsed_time": "4:41:37", "remaining_time": "1 day, 12:18:02", "throughput": 343.73, "total_tokens": 5808320} {"current_steps": 4585, "total_steps": 40000, "loss": 0.0757, "lr": 0.29038312225575524, "epoch": 0.2240246256077004, "percentage": 11.46, "elapsed_time": "4:41:41", "remaining_time": "1 day, 12:15:46", "throughput": 344.06, "total_tokens": 5815072} {"current_steps": 4590, "total_steps": 40000, "loss": 0.0463, "lr": 0.29036235930477505, "epoch": 0.22426892727139472, "percentage": 11.47, "elapsed_time": "4:41:44", "remaining_time": "1 day, 12:13:30", "throughput": 344.43, "total_tokens": 5822304} {"current_steps": 4595, "total_steps": 40000, "loss": 0.0886, "lr": 0.29034157470815514, "epoch": 0.22451322893508904, "percentage": 11.49, "elapsed_time": "4:41:47", "remaining_time": "1 day, 12:11:13", "throughput": 344.73, "total_tokens": 5828544} {"current_steps": 4600, "total_steps": 40000, "loss": 0.0663, "lr": 0.2903207684691008, "epoch": 0.22475753059878337, "percentage": 11.5, "elapsed_time": "4:41:50", "remaining_time": "1 day, 12:08:57", "throughput": 345.03, "total_tokens": 5834624} {"current_steps": 4600, "total_steps": 40000, "eval_loss": 0.0775083526968956, "epoch": 0.22475753059878337, "percentage": 11.5, "elapsed_time": "4:52:30", "remaining_time": "1 day, 13:31:01", "throughput": 332.45, "total_tokens": 5834624} {"current_steps": 4605, "total_steps": 40000, "loss": 0.0819, "lr": 0.29029994059082054, "epoch": 0.22500183226247772, "percentage": 11.51, "elapsed_time": "4:52:34", "remaining_time": "1 day, 13:28:50", "throughput": 332.72, "total_tokens": 5840928} {"current_steps": 4610, "total_steps": 40000, "loss": 0.0422, "lr": 0.2902790910765264, "epoch": 0.22524613392617204, "percentage": 11.53, "elapsed_time": "4:52:38", "remaining_time": "1 day, 13:26:29", "throughput": 333.04, "total_tokens": 5847552} {"current_steps": 4615, "total_steps": 40000, "loss": 0.0957, "lr": 0.29025821992943346, "epoch": 0.22549043558986637, "percentage": 11.54, "elapsed_time": "4:52:41", "remaining_time": "1 day, 13:24:07", "throughput": 333.32, "total_tokens": 5853536} {"current_steps": 4620, "total_steps": 40000, "loss": 0.0742, "lr": 0.29023732715276046, "epoch": 0.2257347372535607, "percentage": 11.55, "elapsed_time": "4:52:44", "remaining_time": "1 day, 13:21:46", "throughput": 333.63, "total_tokens": 5859936} {"current_steps": 4625, "total_steps": 40000, "loss": 0.06, "lr": 0.2902164127497293, "epoch": 0.22597903891725502, "percentage": 11.56, "elapsed_time": "4:52:47", "remaining_time": "1 day, 13:19:25", "throughput": 333.93, "total_tokens": 5866144} {"current_steps": 4630, "total_steps": 40000, "loss": 0.0701, "lr": 0.2901954767235652, "epoch": 0.22622334058094937, "percentage": 11.58, "elapsed_time": "4:52:50", "remaining_time": "1 day, 13:17:04", "throughput": 334.21, "total_tokens": 5872160} {"current_steps": 4635, "total_steps": 40000, "loss": 0.0535, "lr": 0.2901745190774968, "epoch": 0.2264676422446437, "percentage": 11.59, "elapsed_time": "4:52:53", "remaining_time": "1 day, 13:14:44", "throughput": 334.52, "total_tokens": 5878656} {"current_steps": 4640, "total_steps": 40000, "loss": 0.061, "lr": 0.290153539814756, "epoch": 0.22671194390833802, "percentage": 11.6, "elapsed_time": "4:52:56", "remaining_time": "1 day, 13:12:24", "throughput": 334.81, "total_tokens": 5884832} {"current_steps": 4645, "total_steps": 40000, "loss": 0.0937, "lr": 0.2901325389385781, "epoch": 0.22695624557203234, "percentage": 11.61, "elapsed_time": "4:52:59", "remaining_time": "1 day, 13:10:04", "throughput": 335.11, "total_tokens": 5891072} {"current_steps": 4650, "total_steps": 40000, "loss": 0.0693, "lr": 0.2901115164522016, "epoch": 0.22720054723572666, "percentage": 11.62, "elapsed_time": "4:53:02", "remaining_time": "1 day, 13:07:44", "throughput": 335.4, "total_tokens": 5897184} {"current_steps": 4655, "total_steps": 40000, "loss": 0.1009, "lr": 0.29009047235886865, "epoch": 0.22744484889942101, "percentage": 11.64, "elapsed_time": "4:53:05", "remaining_time": "1 day, 13:05:24", "throughput": 335.69, "total_tokens": 5903328} {"current_steps": 4660, "total_steps": 40000, "loss": 0.0561, "lr": 0.2900694066618243, "epoch": 0.22768915056311534, "percentage": 11.65, "elapsed_time": "4:53:08", "remaining_time": "1 day, 13:03:06", "throughput": 336.01, "total_tokens": 5909952} {"current_steps": 4665, "total_steps": 40000, "loss": 0.1068, "lr": 0.2900483193643172, "epoch": 0.22793345222680966, "percentage": 11.66, "elapsed_time": "4:53:11", "remaining_time": "1 day, 13:00:47", "throughput": 336.28, "total_tokens": 5915680} {"current_steps": 4670, "total_steps": 40000, "loss": 0.1238, "lr": 0.29002721046959934, "epoch": 0.228177753890504, "percentage": 11.68, "elapsed_time": "4:53:14", "remaining_time": "1 day, 12:58:28", "throughput": 336.57, "total_tokens": 5921792} {"current_steps": 4675, "total_steps": 40000, "loss": 0.0603, "lr": 0.29000607998092587, "epoch": 0.2284220555541983, "percentage": 11.69, "elapsed_time": "4:53:17", "remaining_time": "1 day, 12:56:10", "throughput": 336.87, "total_tokens": 5928224} {"current_steps": 4680, "total_steps": 40000, "loss": 0.0767, "lr": 0.2899849279015555, "epoch": 0.22866635721789266, "percentage": 11.7, "elapsed_time": "4:53:20", "remaining_time": "1 day, 12:53:53", "throughput": 337.19, "total_tokens": 5934848} {"current_steps": 4685, "total_steps": 40000, "loss": 0.0719, "lr": 0.28996375423475007, "epoch": 0.228910658881587, "percentage": 11.71, "elapsed_time": "4:53:23", "remaining_time": "1 day, 12:51:36", "throughput": 337.48, "total_tokens": 5941024} {"current_steps": 4690, "total_steps": 40000, "loss": 0.0606, "lr": 0.28994255898377486, "epoch": 0.2291549605452813, "percentage": 11.72, "elapsed_time": "4:53:26", "remaining_time": "1 day, 12:49:18", "throughput": 337.77, "total_tokens": 5947168} {"current_steps": 4695, "total_steps": 40000, "loss": 0.0462, "lr": 0.2899213421518984, "epoch": 0.22939926220897564, "percentage": 11.74, "elapsed_time": "4:53:29", "remaining_time": "1 day, 12:47:01", "throughput": 338.07, "total_tokens": 5953376} {"current_steps": 4700, "total_steps": 40000, "loss": 0.0802, "lr": 0.2899001037423926, "epoch": 0.22964356387266996, "percentage": 11.75, "elapsed_time": "4:53:33", "remaining_time": "1 day, 12:44:45", "throughput": 338.36, "total_tokens": 5959520} {"current_steps": 4705, "total_steps": 40000, "loss": 0.0766, "lr": 0.28987884375853273, "epoch": 0.2298878655363643, "percentage": 11.76, "elapsed_time": "4:53:36", "remaining_time": "1 day, 12:42:30", "throughput": 338.69, "total_tokens": 5966528} {"current_steps": 4710, "total_steps": 40000, "loss": 0.0698, "lr": 0.2898575622035974, "epoch": 0.23013216720005863, "percentage": 11.77, "elapsed_time": "4:53:39", "remaining_time": "1 day, 12:40:14", "throughput": 339.0, "total_tokens": 5972992} {"current_steps": 4715, "total_steps": 40000, "loss": 0.0996, "lr": 0.2898362590808683, "epoch": 0.23037646886375296, "percentage": 11.79, "elapsed_time": "4:53:42", "remaining_time": "1 day, 12:37:58", "throughput": 339.29, "total_tokens": 5979040} {"current_steps": 4720, "total_steps": 40000, "loss": 0.0781, "lr": 0.2898149343936308, "epoch": 0.23062077052744728, "percentage": 11.8, "elapsed_time": "4:53:45", "remaining_time": "1 day, 12:35:43", "throughput": 339.59, "total_tokens": 5985536} {"current_steps": 4725, "total_steps": 40000, "loss": 0.0663, "lr": 0.2897935881451734, "epoch": 0.23086507219114163, "percentage": 11.81, "elapsed_time": "4:53:48", "remaining_time": "1 day, 12:33:28", "throughput": 339.9, "total_tokens": 5991936} {"current_steps": 4730, "total_steps": 40000, "loss": 0.0742, "lr": 0.28977222033878797, "epoch": 0.23110937385483596, "percentage": 11.82, "elapsed_time": "4:53:51", "remaining_time": "1 day, 12:31:13", "throughput": 340.19, "total_tokens": 5998048} {"current_steps": 4735, "total_steps": 40000, "loss": 0.0638, "lr": 0.28975083097776966, "epoch": 0.23135367551853028, "percentage": 11.84, "elapsed_time": "4:53:54", "remaining_time": "1 day, 12:28:58", "throughput": 340.47, "total_tokens": 6004160} {"current_steps": 4740, "total_steps": 40000, "loss": 0.0888, "lr": 0.28972942006541696, "epoch": 0.2315979771822246, "percentage": 11.85, "elapsed_time": "4:53:57", "remaining_time": "1 day, 12:26:44", "throughput": 340.78, "total_tokens": 6010656} {"current_steps": 4745, "total_steps": 40000, "loss": 0.0889, "lr": 0.2897079876050318, "epoch": 0.23184227884591893, "percentage": 11.86, "elapsed_time": "4:54:00", "remaining_time": "1 day, 12:24:30", "throughput": 341.07, "total_tokens": 6016864} {"current_steps": 4750, "total_steps": 40000, "loss": 0.1037, "lr": 0.2896865335999192, "epoch": 0.23208658050961328, "percentage": 11.88, "elapsed_time": "4:54:03", "remaining_time": "1 day, 12:22:16", "throughput": 341.36, "total_tokens": 6022880} {"current_steps": 4755, "total_steps": 40000, "loss": 0.0567, "lr": 0.28966505805338777, "epoch": 0.2323308821733076, "percentage": 11.89, "elapsed_time": "4:54:07", "remaining_time": "1 day, 12:20:03", "throughput": 341.65, "total_tokens": 6029184} {"current_steps": 4760, "total_steps": 40000, "loss": 0.0693, "lr": 0.2896435609687492, "epoch": 0.23257518383700193, "percentage": 11.9, "elapsed_time": "4:54:10", "remaining_time": "1 day, 12:17:50", "throughput": 341.94, "total_tokens": 6035296} {"current_steps": 4765, "total_steps": 40000, "loss": 0.0475, "lr": 0.2896220423493187, "epoch": 0.23281948550069625, "percentage": 11.91, "elapsed_time": "4:54:13", "remaining_time": "1 day, 12:15:37", "throughput": 342.25, "total_tokens": 6041824} {"current_steps": 4770, "total_steps": 40000, "loss": 0.08, "lr": 0.28960050219841466, "epoch": 0.23306378716439058, "percentage": 11.92, "elapsed_time": "4:54:16", "remaining_time": "1 day, 12:13:25", "throughput": 342.55, "total_tokens": 6048096} {"current_steps": 4775, "total_steps": 40000, "loss": 0.0732, "lr": 0.28957894051935884, "epoch": 0.23330808882808493, "percentage": 11.94, "elapsed_time": "4:54:19", "remaining_time": "1 day, 12:11:12", "throughput": 342.84, "total_tokens": 6054368} {"current_steps": 4780, "total_steps": 40000, "loss": 0.0915, "lr": 0.2895573573154764, "epoch": 0.23355239049177925, "percentage": 11.95, "elapsed_time": "4:54:22", "remaining_time": "1 day, 12:09:00", "throughput": 343.15, "total_tokens": 6060832} {"current_steps": 4785, "total_steps": 40000, "loss": 0.0838, "lr": 0.28953575259009556, "epoch": 0.23379669215547358, "percentage": 11.96, "elapsed_time": "4:54:25", "remaining_time": "1 day, 12:06:48", "throughput": 343.44, "total_tokens": 6067008} {"current_steps": 4790, "total_steps": 40000, "loss": 0.0753, "lr": 0.2895141263465482, "epoch": 0.2340409938191679, "percentage": 11.97, "elapsed_time": "4:54:28", "remaining_time": "1 day, 12:04:36", "throughput": 343.73, "total_tokens": 6073152} {"current_steps": 4795, "total_steps": 40000, "loss": 0.0608, "lr": 0.28949247858816934, "epoch": 0.23428529548286223, "percentage": 11.99, "elapsed_time": "4:54:31", "remaining_time": "1 day, 12:02:26", "throughput": 344.03, "total_tokens": 6079648} {"current_steps": 4800, "total_steps": 40000, "loss": 0.0758, "lr": 0.2894708093182973, "epoch": 0.23452959714655658, "percentage": 12.0, "elapsed_time": "4:54:34", "remaining_time": "1 day, 12:00:14", "throughput": 344.31, "total_tokens": 6085600} {"current_steps": 4800, "total_steps": 40000, "eval_loss": 0.07764232158660889, "epoch": 0.23452959714655658, "percentage": 12.0, "elapsed_time": "5:05:13", "remaining_time": "1 day, 13:18:19", "throughput": 332.3, "total_tokens": 6085600} {"current_steps": 4805, "total_steps": 40000, "loss": 0.0462, "lr": 0.2894491185402737, "epoch": 0.2347738988102509, "percentage": 12.01, "elapsed_time": "5:05:17", "remaining_time": "1 day, 13:16:06", "throughput": 332.58, "total_tokens": 6092000} {"current_steps": 4810, "total_steps": 40000, "loss": 0.1076, "lr": 0.2894274062574437, "epoch": 0.23501820047394523, "percentage": 12.03, "elapsed_time": "5:05:20", "remaining_time": "1 day, 13:13:50", "throughput": 332.86, "total_tokens": 6098048} {"current_steps": 4815, "total_steps": 40000, "loss": 0.0861, "lr": 0.2894056724731554, "epoch": 0.23526250213763955, "percentage": 12.04, "elapsed_time": "5:05:23", "remaining_time": "1 day, 13:11:34", "throughput": 333.14, "total_tokens": 6104256} {"current_steps": 4820, "total_steps": 40000, "loss": 0.0723, "lr": 0.28938391719076056, "epoch": 0.23550680380133387, "percentage": 12.05, "elapsed_time": "5:05:26", "remaining_time": "1 day, 13:09:18", "throughput": 333.42, "total_tokens": 6110400} {"current_steps": 4825, "total_steps": 40000, "loss": 0.067, "lr": 0.28936214041361413, "epoch": 0.23575110546502823, "percentage": 12.06, "elapsed_time": "5:05:29", "remaining_time": "1 day, 13:07:03", "throughput": 333.71, "total_tokens": 6116640} {"current_steps": 4830, "total_steps": 40000, "loss": 0.0622, "lr": 0.2893403421450743, "epoch": 0.23599540712872255, "percentage": 12.07, "elapsed_time": "5:05:32", "remaining_time": "1 day, 13:04:48", "throughput": 334.0, "total_tokens": 6122976} {"current_steps": 4835, "total_steps": 40000, "loss": 0.0544, "lr": 0.2893185223885026, "epoch": 0.23623970879241687, "percentage": 12.09, "elapsed_time": "5:05:35", "remaining_time": "1 day, 13:02:34", "throughput": 334.31, "total_tokens": 6129696} {"current_steps": 4840, "total_steps": 40000, "loss": 0.0944, "lr": 0.289296681147264, "epoch": 0.2364840104561112, "percentage": 12.1, "elapsed_time": "5:05:38", "remaining_time": "1 day, 13:00:21", "throughput": 334.61, "total_tokens": 6136288} {"current_steps": 4845, "total_steps": 40000, "loss": 0.0811, "lr": 0.28927481842472663, "epoch": 0.23672831211980552, "percentage": 12.11, "elapsed_time": "5:05:41", "remaining_time": "1 day, 12:58:06", "throughput": 334.9, "total_tokens": 6142592} {"current_steps": 4850, "total_steps": 40000, "loss": 0.076, "lr": 0.28925293422426207, "epoch": 0.23697261378349987, "percentage": 12.12, "elapsed_time": "5:05:44", "remaining_time": "1 day, 12:55:53", "throughput": 335.19, "total_tokens": 6149088} {"current_steps": 4855, "total_steps": 40000, "loss": 0.0992, "lr": 0.28923102854924504, "epoch": 0.2372169154471942, "percentage": 12.14, "elapsed_time": "5:05:47", "remaining_time": "1 day, 12:53:39", "throughput": 335.47, "total_tokens": 6155232} {"current_steps": 4860, "total_steps": 40000, "loss": 0.0609, "lr": 0.2892091014030537, "epoch": 0.23746121711088852, "percentage": 12.15, "elapsed_time": "5:05:51", "remaining_time": "1 day, 12:51:26", "throughput": 335.78, "total_tokens": 6161856} {"current_steps": 4865, "total_steps": 40000, "loss": 0.0658, "lr": 0.2891871527890696, "epoch": 0.23770551877458285, "percentage": 12.16, "elapsed_time": "5:05:54", "remaining_time": "1 day, 12:49:13", "throughput": 336.06, "total_tokens": 6168160} {"current_steps": 4870, "total_steps": 40000, "loss": 0.0796, "lr": 0.2891651827106773, "epoch": 0.23794982043827717, "percentage": 12.17, "elapsed_time": "5:05:57", "remaining_time": "1 day, 12:47:00", "throughput": 336.35, "total_tokens": 6174496} {"current_steps": 4875, "total_steps": 40000, "loss": 0.065, "lr": 0.2891431911712651, "epoch": 0.23819412210197152, "percentage": 12.19, "elapsed_time": "5:06:00", "remaining_time": "1 day, 12:44:48", "throughput": 336.66, "total_tokens": 6181152} {"current_steps": 4880, "total_steps": 40000, "loss": 0.0805, "lr": 0.2891211781742241, "epoch": 0.23843842376566585, "percentage": 12.2, "elapsed_time": "5:06:03", "remaining_time": "1 day, 12:42:36", "throughput": 336.94, "total_tokens": 6187456} {"current_steps": 4885, "total_steps": 40000, "loss": 0.1046, "lr": 0.2890991437229492, "epoch": 0.23868272542936017, "percentage": 12.21, "elapsed_time": "5:06:06", "remaining_time": "1 day, 12:40:24", "throughput": 337.23, "total_tokens": 6193792} {"current_steps": 4890, "total_steps": 40000, "loss": 0.0907, "lr": 0.2890770878208383, "epoch": 0.2389270270930545, "percentage": 12.22, "elapsed_time": "5:06:09", "remaining_time": "1 day, 12:38:12", "throughput": 337.51, "total_tokens": 6199904} {"current_steps": 4895, "total_steps": 40000, "loss": 0.0695, "lr": 0.28905501047129273, "epoch": 0.23917132875674885, "percentage": 12.24, "elapsed_time": "5:06:12", "remaining_time": "1 day, 12:36:01", "throughput": 337.79, "total_tokens": 6206048} {"current_steps": 4900, "total_steps": 40000, "loss": 0.0903, "lr": 0.289032911677717, "epoch": 0.23941563042044317, "percentage": 12.25, "elapsed_time": "5:06:15", "remaining_time": "1 day, 12:33:50", "throughput": 338.07, "total_tokens": 6212224} {"current_steps": 4905, "total_steps": 40000, "loss": 0.0529, "lr": 0.28901079144351915, "epoch": 0.2396599320841375, "percentage": 12.26, "elapsed_time": "5:06:18", "remaining_time": "1 day, 12:31:39", "throughput": 338.35, "total_tokens": 6218464} {"current_steps": 4910, "total_steps": 40000, "loss": 0.1066, "lr": 0.2889886497721103, "epoch": 0.23990423374783182, "percentage": 12.28, "elapsed_time": "5:06:21", "remaining_time": "1 day, 12:29:28", "throughput": 338.63, "total_tokens": 6224640} {"current_steps": 4915, "total_steps": 40000, "loss": 0.0924, "lr": 0.28896648666690505, "epoch": 0.24014853541152614, "percentage": 12.29, "elapsed_time": "5:06:24", "remaining_time": "1 day, 12:27:17", "throughput": 338.89, "total_tokens": 6230464} {"current_steps": 4920, "total_steps": 40000, "loss": 0.0777, "lr": 0.2889443021313212, "epoch": 0.2403928370752205, "percentage": 12.3, "elapsed_time": "5:06:27", "remaining_time": "1 day, 12:25:07", "throughput": 339.19, "total_tokens": 6236928} {"current_steps": 4925, "total_steps": 40000, "loss": 0.0418, "lr": 0.28892209616877984, "epoch": 0.24063713873891482, "percentage": 12.31, "elapsed_time": "5:06:31", "remaining_time": "1 day, 12:22:57", "throughput": 339.5, "total_tokens": 6243712} {"current_steps": 4930, "total_steps": 40000, "loss": 0.0814, "lr": 0.28889986878270546, "epoch": 0.24088144040260914, "percentage": 12.32, "elapsed_time": "5:06:34", "remaining_time": "1 day, 12:20:47", "throughput": 339.77, "total_tokens": 6249792} {"current_steps": 4935, "total_steps": 40000, "loss": 0.1072, "lr": 0.28887761997652583, "epoch": 0.24112574206630347, "percentage": 12.34, "elapsed_time": "5:06:37", "remaining_time": "1 day, 12:18:38", "throughput": 340.05, "total_tokens": 6255872} {"current_steps": 4940, "total_steps": 40000, "loss": 0.0635, "lr": 0.2888553497536719, "epoch": 0.2413700437299978, "percentage": 12.35, "elapsed_time": "5:06:40", "remaining_time": "1 day, 12:16:29", "throughput": 340.34, "total_tokens": 6262304} {"current_steps": 4945, "total_steps": 40000, "loss": 0.0451, "lr": 0.2888330581175781, "epoch": 0.24161434539369214, "percentage": 12.36, "elapsed_time": "5:06:43", "remaining_time": "1 day, 12:14:21", "throughput": 340.63, "total_tokens": 6268832} {"current_steps": 4950, "total_steps": 40000, "loss": 0.0971, "lr": 0.28881074507168203, "epoch": 0.24185864705738647, "percentage": 12.38, "elapsed_time": "5:06:46", "remaining_time": "1 day, 12:12:13", "throughput": 340.93, "total_tokens": 6275328} {"current_steps": 4955, "total_steps": 40000, "loss": 0.0812, "lr": 0.2887884106194247, "epoch": 0.2421029487210808, "percentage": 12.39, "elapsed_time": "5:06:49", "remaining_time": "1 day, 12:10:04", "throughput": 341.22, "total_tokens": 6281664} {"current_steps": 4960, "total_steps": 40000, "loss": 0.0638, "lr": 0.28876605476425027, "epoch": 0.24234725038477511, "percentage": 12.4, "elapsed_time": "5:06:52", "remaining_time": "1 day, 12:07:56", "throughput": 341.5, "total_tokens": 6287936} {"current_steps": 4965, "total_steps": 40000, "loss": 0.0649, "lr": 0.2887436775096064, "epoch": 0.24259155204846944, "percentage": 12.41, "elapsed_time": "5:06:55", "remaining_time": "1 day, 12:05:48", "throughput": 341.76, "total_tokens": 6293824} {"current_steps": 4970, "total_steps": 40000, "loss": 0.0454, "lr": 0.2887212788589439, "epoch": 0.2428358537121638, "percentage": 12.43, "elapsed_time": "5:06:58", "remaining_time": "1 day, 12:03:41", "throughput": 342.06, "total_tokens": 6300416} {"current_steps": 4975, "total_steps": 40000, "loss": 0.0544, "lr": 0.2886988588157169, "epoch": 0.24308015537585811, "percentage": 12.44, "elapsed_time": "5:07:01", "remaining_time": "1 day, 12:01:34", "throughput": 342.35, "total_tokens": 6306784} {"current_steps": 4980, "total_steps": 40000, "loss": 0.0797, "lr": 0.28867641738338284, "epoch": 0.24332445703955244, "percentage": 12.45, "elapsed_time": "5:07:05", "remaining_time": "1 day, 11:59:26", "throughput": 342.64, "total_tokens": 6313152} {"current_steps": 4985, "total_steps": 40000, "loss": 0.0905, "lr": 0.2886539545654026, "epoch": 0.24356875870324676, "percentage": 12.46, "elapsed_time": "5:07:08", "remaining_time": "1 day, 11:57:20", "throughput": 342.94, "total_tokens": 6319776} {"current_steps": 4990, "total_steps": 40000, "loss": 0.0886, "lr": 0.28863147036524006, "epoch": 0.2438130603669411, "percentage": 12.47, "elapsed_time": "5:07:11", "remaining_time": "1 day, 11:55:14", "throughput": 343.25, "total_tokens": 6326624} {"current_steps": 4995, "total_steps": 40000, "loss": 0.0517, "lr": 0.2886089647863626, "epoch": 0.24405736203063544, "percentage": 12.49, "elapsed_time": "5:07:14", "remaining_time": "1 day, 11:53:08", "throughput": 343.54, "total_tokens": 6332960} {"current_steps": 5000, "total_steps": 40000, "loss": 0.0498, "lr": 0.288586437832241, "epoch": 0.24430166369432976, "percentage": 12.5, "elapsed_time": "5:07:17", "remaining_time": "1 day, 11:51:02", "throughput": 343.84, "total_tokens": 6339520} {"current_steps": 5000, "total_steps": 40000, "eval_loss": 0.07972920686006546, "epoch": 0.24430166369432976, "percentage": 12.5, "elapsed_time": "5:17:56", "remaining_time": "1 day, 13:05:33", "throughput": 332.33, "total_tokens": 6339520} {"current_steps": 5005, "total_steps": 40000, "loss": 0.0854, "lr": 0.28856388950634904, "epoch": 0.2445459653580241, "percentage": 12.51, "elapsed_time": "5:18:00", "remaining_time": "1 day, 13:03:29", "throughput": 332.6, "total_tokens": 6346080} {"current_steps": 5010, "total_steps": 40000, "loss": 0.0563, "lr": 0.288541319812164, "epoch": 0.2447902670217184, "percentage": 12.53, "elapsed_time": "5:18:03", "remaining_time": "1 day, 13:01:18", "throughput": 332.89, "total_tokens": 6352576} {"current_steps": 5015, "total_steps": 40000, "loss": 0.0861, "lr": 0.2885187287531665, "epoch": 0.24503456868541273, "percentage": 12.54, "elapsed_time": "5:18:06", "remaining_time": "1 day, 12:59:07", "throughput": 333.14, "total_tokens": 6358496} {"current_steps": 5020, "total_steps": 40000, "loss": 0.0727, "lr": 0.2884961163328402, "epoch": 0.2452788703491071, "percentage": 12.55, "elapsed_time": "5:18:09", "remaining_time": "1 day, 12:56:57", "throughput": 333.43, "total_tokens": 6364960} {"current_steps": 5025, "total_steps": 40000, "loss": 0.0708, "lr": 0.28847348255467237, "epoch": 0.2455231720128014, "percentage": 12.56, "elapsed_time": "5:18:12", "remaining_time": "1 day, 12:54:46", "throughput": 333.68, "total_tokens": 6370784} {"current_steps": 5030, "total_steps": 40000, "loss": 0.0628, "lr": 0.28845082742215333, "epoch": 0.24576747367649573, "percentage": 12.57, "elapsed_time": "5:18:15", "remaining_time": "1 day, 12:52:37", "throughput": 333.95, "total_tokens": 6376928} {"current_steps": 5035, "total_steps": 40000, "loss": 0.0934, "lr": 0.2884281509387769, "epoch": 0.24601177534019006, "percentage": 12.59, "elapsed_time": "5:18:18", "remaining_time": "1 day, 12:50:27", "throughput": 334.22, "total_tokens": 6383072} {"current_steps": 5040, "total_steps": 40000, "loss": 0.0567, "lr": 0.2884054531080399, "epoch": 0.24625607700388438, "percentage": 12.6, "elapsed_time": "5:18:21", "remaining_time": "1 day, 12:48:18", "throughput": 334.49, "total_tokens": 6389216} {"current_steps": 5045, "total_steps": 40000, "loss": 0.0418, "lr": 0.28838273393344277, "epoch": 0.24650037866757873, "percentage": 12.61, "elapsed_time": "5:18:24", "remaining_time": "1 day, 12:46:10", "throughput": 334.77, "total_tokens": 6395680} {"current_steps": 5050, "total_steps": 40000, "loss": 0.054, "lr": 0.288359993418489, "epoch": 0.24674468033127306, "percentage": 12.62, "elapsed_time": "5:18:27", "remaining_time": "1 day, 12:44:01", "throughput": 335.04, "total_tokens": 6401856} {"current_steps": 5055, "total_steps": 40000, "loss": 0.0728, "lr": 0.28833723156668556, "epoch": 0.24698898199496738, "percentage": 12.64, "elapsed_time": "5:18:30", "remaining_time": "1 day, 12:41:53", "throughput": 335.31, "total_tokens": 6408064} {"current_steps": 5060, "total_steps": 40000, "loss": 0.0842, "lr": 0.2883144483815425, "epoch": 0.2472332836586617, "percentage": 12.65, "elapsed_time": "5:18:34", "remaining_time": "1 day, 12:39:44", "throughput": 335.59, "total_tokens": 6414496} {"current_steps": 5065, "total_steps": 40000, "loss": 0.0564, "lr": 0.28829164386657335, "epoch": 0.24747758532235606, "percentage": 12.66, "elapsed_time": "5:18:37", "remaining_time": "1 day, 12:37:36", "throughput": 335.86, "total_tokens": 6420576} {"current_steps": 5070, "total_steps": 40000, "loss": 0.0693, "lr": 0.28826881802529486, "epoch": 0.24772188698605038, "percentage": 12.68, "elapsed_time": "5:18:40", "remaining_time": "1 day, 12:35:28", "throughput": 336.13, "total_tokens": 6426816} {"current_steps": 5075, "total_steps": 40000, "loss": 0.0416, "lr": 0.28824597086122705, "epoch": 0.2479661886497447, "percentage": 12.69, "elapsed_time": "5:18:43", "remaining_time": "1 day, 12:33:20", "throughput": 336.38, "total_tokens": 6432640} {"current_steps": 5080, "total_steps": 40000, "loss": 0.045, "lr": 0.28822310237789317, "epoch": 0.24821049031343903, "percentage": 12.7, "elapsed_time": "5:18:46", "remaining_time": "1 day, 12:31:13", "throughput": 336.66, "total_tokens": 6438912} {"current_steps": 5085, "total_steps": 40000, "loss": 0.0816, "lr": 0.2882002125788199, "epoch": 0.24845479197713335, "percentage": 12.71, "elapsed_time": "5:18:49", "remaining_time": "1 day, 12:29:05", "throughput": 336.92, "total_tokens": 6445024} {"current_steps": 5090, "total_steps": 40000, "loss": 0.0781, "lr": 0.2881773014675371, "epoch": 0.2486990936408277, "percentage": 12.72, "elapsed_time": "5:18:52", "remaining_time": "1 day, 12:26:58", "throughput": 337.19, "total_tokens": 6451264} {"current_steps": 5095, "total_steps": 40000, "loss": 0.0902, "lr": 0.288154369047578, "epoch": 0.24894339530452203, "percentage": 12.74, "elapsed_time": "5:18:55", "remaining_time": "1 day, 12:24:52", "throughput": 337.48, "total_tokens": 6457760} {"current_steps": 5100, "total_steps": 40000, "loss": 0.0703, "lr": 0.28813141532247905, "epoch": 0.24918769696821635, "percentage": 12.75, "elapsed_time": "5:18:58", "remaining_time": "1 day, 12:22:46", "throughput": 337.75, "total_tokens": 6463904} {"current_steps": 5105, "total_steps": 40000, "loss": 0.0681, "lr": 0.28810844029578, "epoch": 0.24943199863191068, "percentage": 12.76, "elapsed_time": "5:19:01", "remaining_time": "1 day, 12:20:40", "throughput": 338.03, "total_tokens": 6470304} {"current_steps": 5110, "total_steps": 40000, "loss": 0.08, "lr": 0.2880854439710238, "epoch": 0.249676300295605, "percentage": 12.78, "elapsed_time": "5:19:04", "remaining_time": "1 day, 12:18:35", "throughput": 338.31, "total_tokens": 6476864} {"current_steps": 5115, "total_steps": 40000, "loss": 0.0672, "lr": 0.28806242635175694, "epoch": 0.24992060195929935, "percentage": 12.79, "elapsed_time": "5:19:07", "remaining_time": "1 day, 12:16:30", "throughput": 338.59, "total_tokens": 6483232} {"current_steps": 5120, "total_steps": 40000, "loss": 0.0853, "lr": 0.2880393874415289, "epoch": 0.25016490362299365, "percentage": 12.8, "elapsed_time": "5:19:10", "remaining_time": "1 day, 12:14:25", "throughput": 338.86, "total_tokens": 6489536} {"current_steps": 5125, "total_steps": 40000, "loss": 0.0606, "lr": 0.2880163272438926, "epoch": 0.250409205286688, "percentage": 12.81, "elapsed_time": "5:19:13", "remaining_time": "1 day, 12:12:20", "throughput": 339.15, "total_tokens": 6496160} {"current_steps": 5130, "total_steps": 40000, "loss": 0.0771, "lr": 0.2879932457624042, "epoch": 0.25065350695038235, "percentage": 12.83, "elapsed_time": "5:19:17", "remaining_time": "1 day, 12:10:16", "throughput": 339.46, "total_tokens": 6503072} {"current_steps": 5135, "total_steps": 40000, "loss": 0.0577, "lr": 0.2879701430006232, "epoch": 0.2508978086140767, "percentage": 12.84, "elapsed_time": "5:19:20", "remaining_time": "1 day, 12:08:13", "throughput": 339.76, "total_tokens": 6509952} {"current_steps": 5140, "total_steps": 40000, "loss": 0.1261, "lr": 0.28794701896211233, "epoch": 0.251142110277771, "percentage": 12.85, "elapsed_time": "5:19:23", "remaining_time": "1 day, 12:06:09", "throughput": 340.04, "total_tokens": 6516384} {"current_steps": 5145, "total_steps": 40000, "loss": 0.0675, "lr": 0.28792387365043753, "epoch": 0.2513864119414653, "percentage": 12.86, "elapsed_time": "5:19:26", "remaining_time": "1 day, 12:04:05", "throughput": 340.33, "total_tokens": 6522912} {"current_steps": 5150, "total_steps": 40000, "loss": 0.0475, "lr": 0.28790070706916815, "epoch": 0.25163071360515965, "percentage": 12.88, "elapsed_time": "5:19:29", "remaining_time": "1 day, 12:02:01", "throughput": 340.6, "total_tokens": 6529184} {"current_steps": 5155, "total_steps": 40000, "loss": 0.1111, "lr": 0.2878775192218768, "epoch": 0.251875015268854, "percentage": 12.89, "elapsed_time": "5:19:32", "remaining_time": "1 day, 11:59:58", "throughput": 340.88, "total_tokens": 6535616} {"current_steps": 5160, "total_steps": 40000, "loss": 0.109, "lr": 0.2878543101121393, "epoch": 0.2521193169325483, "percentage": 12.9, "elapsed_time": "5:19:35", "remaining_time": "1 day, 11:57:54", "throughput": 341.14, "total_tokens": 6541728} {"current_steps": 5165, "total_steps": 40000, "loss": 0.0771, "lr": 0.28783107974353483, "epoch": 0.2523636185962426, "percentage": 12.91, "elapsed_time": "5:19:38", "remaining_time": "1 day, 11:55:51", "throughput": 341.44, "total_tokens": 6548416} {"current_steps": 5170, "total_steps": 40000, "loss": 0.0904, "lr": 0.2878078281196457, "epoch": 0.25260792025993695, "percentage": 12.93, "elapsed_time": "5:19:42", "remaining_time": "1 day, 11:53:48", "throughput": 341.71, "total_tokens": 6554688} {"current_steps": 5175, "total_steps": 40000, "loss": 0.0541, "lr": 0.28778455524405777, "epoch": 0.2528522219236313, "percentage": 12.94, "elapsed_time": "5:19:45", "remaining_time": "1 day, 11:51:45", "throughput": 341.97, "total_tokens": 6560768} {"current_steps": 5180, "total_steps": 40000, "loss": 0.0662, "lr": 0.2877612611203598, "epoch": 0.25309652358732565, "percentage": 12.95, "elapsed_time": "5:19:48", "remaining_time": "1 day, 11:49:42", "throughput": 342.24, "total_tokens": 6566976} {"current_steps": 5185, "total_steps": 40000, "loss": 0.1006, "lr": 0.28773794575214423, "epoch": 0.25334082525102, "percentage": 12.96, "elapsed_time": "5:19:51", "remaining_time": "1 day, 11:47:40", "throughput": 342.5, "total_tokens": 6573056} {"current_steps": 5190, "total_steps": 40000, "loss": 0.0726, "lr": 0.28771460914300645, "epoch": 0.2535851269147143, "percentage": 12.97, "elapsed_time": "5:19:54", "remaining_time": "1 day, 11:45:38", "throughput": 342.79, "total_tokens": 6579584} {"current_steps": 5195, "total_steps": 40000, "loss": 0.0724, "lr": 0.2876912512965454, "epoch": 0.2538294285784086, "percentage": 12.99, "elapsed_time": "5:19:57", "remaining_time": "1 day, 11:43:37", "throughput": 343.06, "total_tokens": 6585856} {"current_steps": 5200, "total_steps": 40000, "loss": 0.1046, "lr": 0.287667872216363, "epoch": 0.25407373024210295, "percentage": 13.0, "elapsed_time": "5:20:00", "remaining_time": "1 day, 11:41:35", "throughput": 343.33, "total_tokens": 6592160} {"current_steps": 5200, "total_steps": 40000, "eval_loss": 0.07866477221250534, "epoch": 0.25407373024210295, "percentage": 13.0, "elapsed_time": "5:30:39", "remaining_time": "1 day, 12:52:52", "throughput": 332.27, "total_tokens": 6592160} {"current_steps": 5205, "total_steps": 40000, "loss": 0.0587, "lr": 0.2876444719060647, "epoch": 0.25431803190579727, "percentage": 13.01, "elapsed_time": "5:30:43", "remaining_time": "1 day, 12:50:50", "throughput": 332.53, "total_tokens": 6598496} {"current_steps": 5210, "total_steps": 40000, "loss": 0.0798, "lr": 0.287621050369259, "epoch": 0.2545623335694916, "percentage": 13.03, "elapsed_time": "5:30:46", "remaining_time": "1 day, 12:48:44", "throughput": 332.78, "total_tokens": 6604512} {"current_steps": 5215, "total_steps": 40000, "loss": 0.0934, "lr": 0.28759760760955794, "epoch": 0.2548066352331859, "percentage": 13.04, "elapsed_time": "5:30:49", "remaining_time": "1 day, 12:46:38", "throughput": 333.04, "total_tokens": 6610592} {"current_steps": 5220, "total_steps": 40000, "loss": 0.0884, "lr": 0.2875741436305766, "epoch": 0.25505093689688024, "percentage": 13.05, "elapsed_time": "5:30:52", "remaining_time": "1 day, 12:44:32", "throughput": 333.31, "total_tokens": 6617056} {"current_steps": 5225, "total_steps": 40000, "loss": 0.0784, "lr": 0.28755065843593347, "epoch": 0.2552952385605746, "percentage": 13.06, "elapsed_time": "5:30:55", "remaining_time": "1 day, 12:42:27", "throughput": 333.59, "total_tokens": 6623584} {"current_steps": 5230, "total_steps": 40000, "loss": 0.0904, "lr": 0.2875271520292502, "epoch": 0.25553954022426895, "percentage": 13.08, "elapsed_time": "5:30:58", "remaining_time": "1 day, 12:40:23", "throughput": 333.85, "total_tokens": 6629856} {"current_steps": 5235, "total_steps": 40000, "loss": 0.0504, "lr": 0.28750362441415184, "epoch": 0.25578384188796327, "percentage": 13.09, "elapsed_time": "5:31:01", "remaining_time": "1 day, 12:38:18", "throughput": 334.1, "total_tokens": 6635776} {"current_steps": 5240, "total_steps": 40000, "loss": 0.073, "lr": 0.28748007559426664, "epoch": 0.2560281435516576, "percentage": 13.1, "elapsed_time": "5:31:04", "remaining_time": "1 day, 12:36:15", "throughput": 334.41, "total_tokens": 6643104} {"current_steps": 5245, "total_steps": 40000, "loss": 0.089, "lr": 0.2874565055732261, "epoch": 0.2562724452153519, "percentage": 13.11, "elapsed_time": "5:31:07", "remaining_time": "1 day, 12:34:11", "throughput": 334.68, "total_tokens": 6649344} {"current_steps": 5250, "total_steps": 40000, "loss": 0.0982, "lr": 0.28743291435466495, "epoch": 0.25651674687904624, "percentage": 13.12, "elapsed_time": "5:31:11", "remaining_time": "1 day, 12:32:07", "throughput": 334.94, "total_tokens": 6655520} {"current_steps": 5255, "total_steps": 40000, "loss": 0.0807, "lr": 0.2874093019422214, "epoch": 0.25676104854274057, "percentage": 13.14, "elapsed_time": "5:31:14", "remaining_time": "1 day, 12:30:03", "throughput": 335.22, "total_tokens": 6662112} {"current_steps": 5260, "total_steps": 40000, "loss": 0.087, "lr": 0.28738566833953666, "epoch": 0.2570053502064349, "percentage": 13.15, "elapsed_time": "5:31:17", "remaining_time": "1 day, 12:28:00", "throughput": 335.49, "total_tokens": 6668544} {"current_steps": 5265, "total_steps": 40000, "loss": 0.0751, "lr": 0.28736201355025537, "epoch": 0.2572496518701292, "percentage": 13.16, "elapsed_time": "5:31:20", "remaining_time": "1 day, 12:25:57", "throughput": 335.75, "total_tokens": 6674848} {"current_steps": 5270, "total_steps": 40000, "loss": 0.1036, "lr": 0.28733833757802535, "epoch": 0.25749395353382354, "percentage": 13.18, "elapsed_time": "5:31:23", "remaining_time": "1 day, 12:23:54", "throughput": 336.01, "total_tokens": 6681088} {"current_steps": 5275, "total_steps": 40000, "loss": 0.0738, "lr": 0.28731464042649785, "epoch": 0.2577382551975179, "percentage": 13.19, "elapsed_time": "5:31:26", "remaining_time": "1 day, 12:21:52", "throughput": 336.3, "total_tokens": 6687808} {"current_steps": 5280, "total_steps": 40000, "loss": 0.0563, "lr": 0.2872909220993271, "epoch": 0.25798255686121224, "percentage": 13.2, "elapsed_time": "5:31:29", "remaining_time": "1 day, 12:19:50", "throughput": 336.58, "total_tokens": 6694528} {"current_steps": 5285, "total_steps": 40000, "loss": 0.0677, "lr": 0.287267182600171, "epoch": 0.25822685852490657, "percentage": 13.21, "elapsed_time": "5:31:32", "remaining_time": "1 day, 12:17:47", "throughput": 336.85, "total_tokens": 6700800} {"current_steps": 5290, "total_steps": 40000, "loss": 0.0597, "lr": 0.2872434219326902, "epoch": 0.2584711601886009, "percentage": 13.23, "elapsed_time": "5:31:35", "remaining_time": "1 day, 12:15:45", "throughput": 337.09, "total_tokens": 6706656} {"current_steps": 5295, "total_steps": 40000, "loss": 0.1085, "lr": 0.28721964010054907, "epoch": 0.2587154618522952, "percentage": 13.24, "elapsed_time": "5:31:38", "remaining_time": "1 day, 12:13:43", "throughput": 337.37, "total_tokens": 6713376} {"current_steps": 5300, "total_steps": 40000, "loss": 0.079, "lr": 0.28719583710741503, "epoch": 0.25895976351598954, "percentage": 13.25, "elapsed_time": "5:31:42", "remaining_time": "1 day, 12:11:42", "throughput": 337.64, "total_tokens": 6719712} {"current_steps": 5305, "total_steps": 40000, "loss": 0.0396, "lr": 0.28717201295695877, "epoch": 0.25920406517968386, "percentage": 13.26, "elapsed_time": "5:31:45", "remaining_time": "1 day, 12:09:41", "throughput": 337.93, "total_tokens": 6726528} {"current_steps": 5310, "total_steps": 40000, "loss": 0.0961, "lr": 0.28714816765285434, "epoch": 0.2594483668433782, "percentage": 13.28, "elapsed_time": "5:31:48", "remaining_time": "1 day, 12:07:40", "throughput": 338.18, "total_tokens": 6732576} {"current_steps": 5315, "total_steps": 40000, "loss": 0.0881, "lr": 0.28712430119877896, "epoch": 0.2596926685070725, "percentage": 13.29, "elapsed_time": "5:31:51", "remaining_time": "1 day, 12:05:39", "throughput": 338.44, "total_tokens": 6738720} {"current_steps": 5320, "total_steps": 40000, "loss": 0.1012, "lr": 0.28710041359841304, "epoch": 0.2599369701707669, "percentage": 13.3, "elapsed_time": "5:31:54", "remaining_time": "1 day, 12:03:38", "throughput": 338.69, "total_tokens": 6744768} {"current_steps": 5325, "total_steps": 40000, "loss": 0.0545, "lr": 0.28707650485544056, "epoch": 0.2601812718344612, "percentage": 13.31, "elapsed_time": "5:31:57", "remaining_time": "1 day, 12:01:38", "throughput": 338.98, "total_tokens": 6751744} {"current_steps": 5330, "total_steps": 40000, "loss": 0.0635, "lr": 0.28705257497354836, "epoch": 0.26042557349815554, "percentage": 13.33, "elapsed_time": "5:32:00", "remaining_time": "1 day, 11:59:38", "throughput": 339.23, "total_tokens": 6757760} {"current_steps": 5335, "total_steps": 40000, "loss": 0.0692, "lr": 0.28702862395642675, "epoch": 0.26066987516184986, "percentage": 13.34, "elapsed_time": "5:32:03", "remaining_time": "1 day, 11:57:37", "throughput": 339.49, "total_tokens": 6763840} {"current_steps": 5340, "total_steps": 40000, "loss": 0.0634, "lr": 0.28700465180776935, "epoch": 0.2609141768255442, "percentage": 13.35, "elapsed_time": "5:32:06", "remaining_time": "1 day, 11:55:38", "throughput": 339.78, "total_tokens": 6770784} {"current_steps": 5345, "total_steps": 40000, "loss": 0.0967, "lr": 0.2869806585312729, "epoch": 0.2611584784892385, "percentage": 13.36, "elapsed_time": "5:32:09", "remaining_time": "1 day, 11:53:38", "throughput": 340.04, "total_tokens": 6777088} {"current_steps": 5350, "total_steps": 40000, "loss": 0.0712, "lr": 0.28695664413063754, "epoch": 0.26140278015293283, "percentage": 13.38, "elapsed_time": "5:32:13", "remaining_time": "1 day, 11:51:39", "throughput": 340.32, "total_tokens": 6783552} {"current_steps": 5355, "total_steps": 40000, "loss": 0.0935, "lr": 0.28693260860956654, "epoch": 0.26164708181662716, "percentage": 13.39, "elapsed_time": "5:32:16", "remaining_time": "1 day, 11:49:39", "throughput": 340.57, "total_tokens": 6789568} {"current_steps": 5360, "total_steps": 40000, "loss": 0.047, "lr": 0.2869085519717665, "epoch": 0.2618913834803215, "percentage": 13.4, "elapsed_time": "5:32:19", "remaining_time": "1 day, 11:47:40", "throughput": 340.83, "total_tokens": 6795936} {"current_steps": 5365, "total_steps": 40000, "loss": 0.0889, "lr": 0.28688447422094726, "epoch": 0.2621356851440158, "percentage": 13.41, "elapsed_time": "5:32:22", "remaining_time": "1 day, 11:45:42", "throughput": 341.11, "total_tokens": 6802464} {"current_steps": 5370, "total_steps": 40000, "loss": 0.0871, "lr": 0.2868603753608219, "epoch": 0.2623799868077102, "percentage": 13.43, "elapsed_time": "5:32:25", "remaining_time": "1 day, 11:43:43", "throughput": 341.37, "total_tokens": 6808704} {"current_steps": 5375, "total_steps": 40000, "loss": 0.0673, "lr": 0.28683625539510665, "epoch": 0.2626242884714045, "percentage": 13.44, "elapsed_time": "5:32:28", "remaining_time": "1 day, 11:41:44", "throughput": 341.62, "total_tokens": 6814848} {"current_steps": 5380, "total_steps": 40000, "loss": 0.074, "lr": 0.28681211432752135, "epoch": 0.26286859013509883, "percentage": 13.45, "elapsed_time": "5:32:31", "remaining_time": "1 day, 11:39:46", "throughput": 341.89, "total_tokens": 6821184} {"current_steps": 5385, "total_steps": 40000, "loss": 0.0801, "lr": 0.2867879521617887, "epoch": 0.26311289179879316, "percentage": 13.46, "elapsed_time": "5:32:34", "remaining_time": "1 day, 11:37:48", "throughput": 342.15, "total_tokens": 6827488} {"current_steps": 5390, "total_steps": 40000, "loss": 0.0811, "lr": 0.28676376890163485, "epoch": 0.2633571934624875, "percentage": 13.48, "elapsed_time": "5:32:37", "remaining_time": "1 day, 11:35:50", "throughput": 342.41, "total_tokens": 6833696} {"current_steps": 5395, "total_steps": 40000, "loss": 0.067, "lr": 0.2867395645507891, "epoch": 0.2636014951261818, "percentage": 13.49, "elapsed_time": "5:32:40", "remaining_time": "1 day, 11:33:54", "throughput": 342.69, "total_tokens": 6840288} {"current_steps": 5400, "total_steps": 40000, "loss": 0.0593, "lr": 0.2867153391129842, "epoch": 0.26384579678987613, "percentage": 13.5, "elapsed_time": "5:32:43", "remaining_time": "1 day, 11:31:57", "throughput": 342.98, "total_tokens": 6847232} {"current_steps": 5400, "total_steps": 40000, "eval_loss": 0.07613344490528107, "epoch": 0.26384579678987613, "percentage": 13.5, "elapsed_time": "5:43:22", "remaining_time": "1 day, 12:40:10", "throughput": 332.35, "total_tokens": 6847232} {"current_steps": 5405, "total_steps": 40000, "loss": 0.0766, "lr": 0.28669109259195585, "epoch": 0.26409009845357045, "percentage": 13.51, "elapsed_time": "5:43:26", "remaining_time": "1 day, 12:38:14", "throughput": 332.59, "total_tokens": 6853536} {"current_steps": 5410, "total_steps": 40000, "loss": 0.0461, "lr": 0.2866668249914433, "epoch": 0.2643344001172648, "percentage": 13.53, "elapsed_time": "5:43:29", "remaining_time": "1 day, 12:36:12", "throughput": 332.85, "total_tokens": 6859936} {"current_steps": 5415, "total_steps": 40000, "loss": 0.0824, "lr": 0.2866425363151889, "epoch": 0.2645787017809591, "percentage": 13.54, "elapsed_time": "5:43:32", "remaining_time": "1 day, 12:34:11", "throughput": 333.09, "total_tokens": 6865856} {"current_steps": 5420, "total_steps": 40000, "loss": 0.0563, "lr": 0.2866182265669382, "epoch": 0.2648230034446535, "percentage": 13.55, "elapsed_time": "5:43:35", "remaining_time": "1 day, 12:32:10", "throughput": 333.32, "total_tokens": 6871744} {"current_steps": 5425, "total_steps": 40000, "loss": 0.0758, "lr": 0.28659389575044014, "epoch": 0.2650673051083478, "percentage": 13.56, "elapsed_time": "5:43:38", "remaining_time": "1 day, 12:30:09", "throughput": 333.59, "total_tokens": 6878208} {"current_steps": 5430, "total_steps": 40000, "loss": 0.0674, "lr": 0.28656954386944683, "epoch": 0.26531160677204213, "percentage": 13.58, "elapsed_time": "5:43:41", "remaining_time": "1 day, 12:28:09", "throughput": 333.82, "total_tokens": 6884032} {"current_steps": 5435, "total_steps": 40000, "loss": 0.0768, "lr": 0.28654517092771353, "epoch": 0.26555590843573645, "percentage": 13.59, "elapsed_time": "5:43:45", "remaining_time": "1 day, 12:26:09", "throughput": 334.08, "total_tokens": 6890432} {"current_steps": 5440, "total_steps": 40000, "loss": 0.0786, "lr": 0.286520776928999, "epoch": 0.2658002100994308, "percentage": 13.6, "elapsed_time": "5:43:48", "remaining_time": "1 day, 12:24:09", "throughput": 334.34, "total_tokens": 6896736} {"current_steps": 5445, "total_steps": 40000, "loss": 0.1048, "lr": 0.286496361877065, "epoch": 0.2660445117631251, "percentage": 13.61, "elapsed_time": "5:43:51", "remaining_time": "1 day, 12:22:10", "throughput": 334.6, "total_tokens": 6903328} {"current_steps": 5450, "total_steps": 40000, "loss": 0.105, "lr": 0.28647192577567676, "epoch": 0.2662888134268194, "percentage": 13.63, "elapsed_time": "5:43:54", "remaining_time": "1 day, 12:20:10", "throughput": 334.87, "total_tokens": 6909888} {"current_steps": 5455, "total_steps": 40000, "loss": 0.0742, "lr": 0.28644746862860254, "epoch": 0.26653311509051375, "percentage": 13.64, "elapsed_time": "5:43:57", "remaining_time": "1 day, 12:18:11", "throughput": 335.13, "total_tokens": 6916256} {"current_steps": 5460, "total_steps": 40000, "loss": 0.0817, "lr": 0.2864229904396139, "epoch": 0.2667774167542081, "percentage": 13.65, "elapsed_time": "5:44:00", "remaining_time": "1 day, 12:16:12", "throughput": 335.39, "total_tokens": 6922752} {"current_steps": 5465, "total_steps": 40000, "loss": 0.1091, "lr": 0.28639849121248573, "epoch": 0.2670217184179024, "percentage": 13.66, "elapsed_time": "5:44:03", "remaining_time": "1 day, 12:14:14", "throughput": 335.66, "total_tokens": 6929248} {"current_steps": 5470, "total_steps": 40000, "loss": 0.0998, "lr": 0.28637397095099615, "epoch": 0.2672660200815968, "percentage": 13.68, "elapsed_time": "5:44:06", "remaining_time": "1 day, 12:12:15", "throughput": 335.92, "total_tokens": 6935680} {"current_steps": 5475, "total_steps": 40000, "loss": 0.0776, "lr": 0.28634942965892646, "epoch": 0.2675103217452911, "percentage": 13.69, "elapsed_time": "5:44:10", "remaining_time": "1 day, 12:10:17", "throughput": 336.19, "total_tokens": 6942272} {"current_steps": 5480, "total_steps": 40000, "loss": 0.0481, "lr": 0.28632486734006124, "epoch": 0.2677546234089854, "percentage": 13.7, "elapsed_time": "5:44:13", "remaining_time": "1 day, 12:08:19", "throughput": 336.45, "total_tokens": 6948800} {"current_steps": 5485, "total_steps": 40000, "loss": 0.106, "lr": 0.28630028399818835, "epoch": 0.26799892507267975, "percentage": 13.71, "elapsed_time": "5:44:16", "remaining_time": "1 day, 12:06:21", "throughput": 336.7, "total_tokens": 6955008} {"current_steps": 5490, "total_steps": 40000, "loss": 0.0463, "lr": 0.2862756796370987, "epoch": 0.2682432267363741, "percentage": 13.73, "elapsed_time": "5:44:19", "remaining_time": "1 day, 12:04:23", "throughput": 336.96, "total_tokens": 6961312} {"current_steps": 5495, "total_steps": 40000, "loss": 0.0641, "lr": 0.2862510542605868, "epoch": 0.2684875284000684, "percentage": 13.74, "elapsed_time": "5:44:22", "remaining_time": "1 day, 12:02:26", "throughput": 337.23, "total_tokens": 6968064} {"current_steps": 5500, "total_steps": 40000, "loss": 0.098, "lr": 0.2862264078724501, "epoch": 0.2687318300637627, "percentage": 13.75, "elapsed_time": "5:44:25", "remaining_time": "1 day, 12:00:29", "throughput": 337.49, "total_tokens": 6974336} {"current_steps": 5505, "total_steps": 40000, "loss": 0.0811, "lr": 0.28620174047648933, "epoch": 0.26897613172745705, "percentage": 13.76, "elapsed_time": "5:44:28", "remaining_time": "1 day, 11:58:32", "throughput": 337.75, "total_tokens": 6980736} {"current_steps": 5510, "total_steps": 40000, "loss": 0.0706, "lr": 0.2861770520765086, "epoch": 0.26922043339115137, "percentage": 13.78, "elapsed_time": "5:44:31", "remaining_time": "1 day, 11:56:35", "throughput": 337.99, "total_tokens": 6986912} {"current_steps": 5515, "total_steps": 40000, "loss": 0.0559, "lr": 0.2861523426763151, "epoch": 0.26946473505484575, "percentage": 13.79, "elapsed_time": "5:44:34", "remaining_time": "1 day, 11:54:38", "throughput": 338.27, "total_tokens": 6993760} {"current_steps": 5520, "total_steps": 40000, "loss": 0.0459, "lr": 0.2861276122797194, "epoch": 0.2697090367185401, "percentage": 13.8, "elapsed_time": "5:44:38", "remaining_time": "1 day, 11:52:42", "throughput": 338.55, "total_tokens": 7000448} {"current_steps": 5525, "total_steps": 40000, "loss": 0.0694, "lr": 0.28610286089053516, "epoch": 0.2699533383822344, "percentage": 13.81, "elapsed_time": "5:44:41", "remaining_time": "1 day, 11:50:45", "throughput": 338.79, "total_tokens": 7006624} {"current_steps": 5530, "total_steps": 40000, "loss": 0.1219, "lr": 0.28607808851257943, "epoch": 0.2701976400459287, "percentage": 13.83, "elapsed_time": "5:44:44", "remaining_time": "1 day, 11:48:49", "throughput": 339.06, "total_tokens": 7013184} {"current_steps": 5535, "total_steps": 40000, "loss": 0.1066, "lr": 0.28605329514967237, "epoch": 0.27044194170962305, "percentage": 13.84, "elapsed_time": "5:44:47", "remaining_time": "1 day, 11:46:54", "throughput": 339.32, "total_tokens": 7019680} {"current_steps": 5540, "total_steps": 40000, "loss": 0.0622, "lr": 0.2860284808056374, "epoch": 0.27068624337331737, "percentage": 13.85, "elapsed_time": "5:44:50", "remaining_time": "1 day, 11:44:58", "throughput": 339.59, "total_tokens": 7026176} {"current_steps": 5545, "total_steps": 40000, "loss": 0.0726, "lr": 0.28600364548430135, "epoch": 0.2709305450370117, "percentage": 13.86, "elapsed_time": "5:44:53", "remaining_time": "1 day, 11:43:03", "throughput": 339.84, "total_tokens": 7032384} {"current_steps": 5550, "total_steps": 40000, "loss": 0.0776, "lr": 0.28597878918949393, "epoch": 0.271174846700706, "percentage": 13.88, "elapsed_time": "5:44:56", "remaining_time": "1 day, 11:41:07", "throughput": 340.08, "total_tokens": 7038496} {"current_steps": 5555, "total_steps": 40000, "loss": 0.0722, "lr": 0.2859539119250485, "epoch": 0.27141914836440034, "percentage": 13.89, "elapsed_time": "5:44:59", "remaining_time": "1 day, 11:39:12", "throughput": 340.34, "total_tokens": 7044896} {"current_steps": 5560, "total_steps": 40000, "loss": 0.0596, "lr": 0.2859290136948013, "epoch": 0.27166345002809467, "percentage": 13.9, "elapsed_time": "5:45:02", "remaining_time": "1 day, 11:37:17", "throughput": 340.59, "total_tokens": 7051200} {"current_steps": 5565, "total_steps": 40000, "loss": 0.0746, "lr": 0.28590409450259197, "epoch": 0.27190775169178905, "percentage": 13.91, "elapsed_time": "5:45:05", "remaining_time": "1 day, 11:35:23", "throughput": 340.85, "total_tokens": 7057568} {"current_steps": 5570, "total_steps": 40000, "loss": 0.0522, "lr": 0.28587915435226346, "epoch": 0.27215205335548337, "percentage": 13.93, "elapsed_time": "5:45:08", "remaining_time": "1 day, 11:33:28", "throughput": 341.1, "total_tokens": 7063840} {"current_steps": 5575, "total_steps": 40000, "loss": 0.0468, "lr": 0.2858541932476617, "epoch": 0.2723963550191777, "percentage": 13.94, "elapsed_time": "5:45:12", "remaining_time": "1 day, 11:31:34", "throughput": 341.38, "total_tokens": 7070784} {"current_steps": 5580, "total_steps": 40000, "loss": 0.0963, "lr": 0.2858292111926361, "epoch": 0.272640656682872, "percentage": 13.95, "elapsed_time": "5:45:15", "remaining_time": "1 day, 11:29:40", "throughput": 341.64, "total_tokens": 7077024} {"current_steps": 5585, "total_steps": 40000, "loss": 0.0764, "lr": 0.28580420819103924, "epoch": 0.27288495834656634, "percentage": 13.96, "elapsed_time": "5:45:18", "remaining_time": "1 day, 11:27:46", "throughput": 341.87, "total_tokens": 7082848} {"current_steps": 5590, "total_steps": 40000, "loss": 0.0608, "lr": 0.2857791842467269, "epoch": 0.27312926001026067, "percentage": 13.98, "elapsed_time": "5:45:21", "remaining_time": "1 day, 11:25:52", "throughput": 342.13, "total_tokens": 7089344} {"current_steps": 5595, "total_steps": 40000, "loss": 0.0634, "lr": 0.2857541393635579, "epoch": 0.273373561673955, "percentage": 13.99, "elapsed_time": "5:45:24", "remaining_time": "1 day, 11:23:58", "throughput": 342.38, "total_tokens": 7095552} {"current_steps": 5600, "total_steps": 40000, "loss": 0.08, "lr": 0.2857290735453948, "epoch": 0.2736178633376493, "percentage": 14.0, "elapsed_time": "5:45:27", "remaining_time": "1 day, 11:22:05", "throughput": 342.64, "total_tokens": 7101984} {"current_steps": 5600, "total_steps": 40000, "eval_loss": 0.07504525780677795, "epoch": 0.2736178633376493, "percentage": 14.0, "elapsed_time": "5:56:06", "remaining_time": "1 day, 12:27:30", "throughput": 332.39, "total_tokens": 7101984} {"current_steps": 5605, "total_steps": 40000, "loss": 0.0647, "lr": 0.28570398679610276, "epoch": 0.27386216500134364, "percentage": 14.01, "elapsed_time": "5:56:10", "remaining_time": "1 day, 12:25:37", "throughput": 332.63, "total_tokens": 7108256} {"current_steps": 5610, "total_steps": 40000, "loss": 0.0841, "lr": 0.2856788791195506, "epoch": 0.27410646666503796, "percentage": 14.03, "elapsed_time": "5:56:13", "remaining_time": "1 day, 12:23:41", "throughput": 332.93, "total_tokens": 7115776} {"current_steps": 5615, "total_steps": 40000, "loss": 0.0709, "lr": 0.28565375051961023, "epoch": 0.27435076832873234, "percentage": 14.04, "elapsed_time": "5:56:16", "remaining_time": "1 day, 12:21:45", "throughput": 333.18, "total_tokens": 7122144} {"current_steps": 5620, "total_steps": 40000, "loss": 0.062, "lr": 0.28562860100015686, "epoch": 0.27459506999242667, "percentage": 14.05, "elapsed_time": "5:56:19", "remaining_time": "1 day, 12:19:48", "throughput": 333.43, "total_tokens": 7128608} {"current_steps": 5625, "total_steps": 40000, "loss": 0.0874, "lr": 0.2856034305650687, "epoch": 0.274839371656121, "percentage": 14.06, "elapsed_time": "5:56:22", "remaining_time": "1 day, 12:17:52", "throughput": 333.68, "total_tokens": 7134976} {"current_steps": 5630, "total_steps": 40000, "loss": 0.0568, "lr": 0.28557823921822756, "epoch": 0.2750836733198153, "percentage": 14.07, "elapsed_time": "5:56:25", "remaining_time": "1 day, 12:15:56", "throughput": 333.93, "total_tokens": 7141408} {"current_steps": 5635, "total_steps": 40000, "loss": 0.0689, "lr": 0.2855530269635181, "epoch": 0.27532797498350964, "percentage": 14.09, "elapsed_time": "5:56:28", "remaining_time": "1 day, 12:13:59", "throughput": 334.17, "total_tokens": 7147424} {"current_steps": 5640, "total_steps": 40000, "loss": 0.0929, "lr": 0.2855277938048284, "epoch": 0.27557227664720396, "percentage": 14.1, "elapsed_time": "5:56:31", "remaining_time": "1 day, 12:12:03", "throughput": 334.41, "total_tokens": 7153600} {"current_steps": 5645, "total_steps": 40000, "loss": 0.1021, "lr": 0.2855025397460498, "epoch": 0.2758165783108983, "percentage": 14.11, "elapsed_time": "5:56:35", "remaining_time": "1 day, 12:10:09", "throughput": 334.68, "total_tokens": 7160448} {"current_steps": 5650, "total_steps": 40000, "loss": 0.0798, "lr": 0.28547726479107666, "epoch": 0.2760608799745926, "percentage": 14.12, "elapsed_time": "5:56:38", "remaining_time": "1 day, 12:08:13", "throughput": 334.91, "total_tokens": 7166560} {"current_steps": 5655, "total_steps": 40000, "loss": 0.0883, "lr": 0.2854519689438068, "epoch": 0.27630518163828693, "percentage": 14.14, "elapsed_time": "5:56:41", "remaining_time": "1 day, 12:06:17", "throughput": 335.16, "total_tokens": 7172832} {"current_steps": 5660, "total_steps": 40000, "loss": 0.0826, "lr": 0.2854266522081412, "epoch": 0.2765494833019813, "percentage": 14.15, "elapsed_time": "5:56:44", "remaining_time": "1 day, 12:04:23", "throughput": 335.43, "total_tokens": 7179616} {"current_steps": 5665, "total_steps": 40000, "loss": 0.0626, "lr": 0.28540131458798385, "epoch": 0.27679378496567564, "percentage": 14.16, "elapsed_time": "5:56:47", "remaining_time": "1 day, 12:02:28", "throughput": 335.67, "total_tokens": 7185792} {"current_steps": 5670, "total_steps": 40000, "loss": 0.0855, "lr": 0.28537595608724226, "epoch": 0.27703808662936996, "percentage": 14.17, "elapsed_time": "5:56:50", "remaining_time": "1 day, 12:00:34", "throughput": 335.91, "total_tokens": 7191968} {"current_steps": 5675, "total_steps": 40000, "loss": 0.0944, "lr": 0.28535057670982705, "epoch": 0.2772823882930643, "percentage": 14.19, "elapsed_time": "5:56:53", "remaining_time": "1 day, 11:58:39", "throughput": 336.15, "total_tokens": 7198272} {"current_steps": 5680, "total_steps": 40000, "loss": 0.1427, "lr": 0.285325176459652, "epoch": 0.2775266899567586, "percentage": 14.2, "elapsed_time": "5:56:56", "remaining_time": "1 day, 11:56:45", "throughput": 336.38, "total_tokens": 7204224} {"current_steps": 5685, "total_steps": 40000, "loss": 0.0611, "lr": 0.28529975534063406, "epoch": 0.27777099162045293, "percentage": 14.21, "elapsed_time": "5:56:59", "remaining_time": "1 day, 11:54:51", "throughput": 336.64, "total_tokens": 7210880} {"current_steps": 5690, "total_steps": 40000, "loss": 0.0838, "lr": 0.2852743133566936, "epoch": 0.27801529328414726, "percentage": 14.22, "elapsed_time": "5:57:02", "remaining_time": "1 day, 11:52:57", "throughput": 336.88, "total_tokens": 7216928} {"current_steps": 5695, "total_steps": 40000, "loss": 0.0706, "lr": 0.2852488505117541, "epoch": 0.2782595949478416, "percentage": 14.24, "elapsed_time": "5:57:05", "remaining_time": "1 day, 11:51:03", "throughput": 337.14, "total_tokens": 7223488} {"current_steps": 5700, "total_steps": 40000, "loss": 0.1021, "lr": 0.28522336680974214, "epoch": 0.2785038966115359, "percentage": 14.25, "elapsed_time": "5:57:09", "remaining_time": "1 day, 11:49:10", "throughput": 337.38, "total_tokens": 7229728} {"current_steps": 5705, "total_steps": 40000, "loss": 0.0613, "lr": 0.2851978622545877, "epoch": 0.27874819827523023, "percentage": 14.26, "elapsed_time": "5:57:12", "remaining_time": "1 day, 11:47:17", "throughput": 337.63, "total_tokens": 7236160} {"current_steps": 5710, "total_steps": 40000, "loss": 0.0376, "lr": 0.285172336850224, "epoch": 0.2789924999389246, "percentage": 14.27, "elapsed_time": "5:57:15", "remaining_time": "1 day, 11:45:23", "throughput": 337.87, "total_tokens": 7242336} {"current_steps": 5715, "total_steps": 40000, "loss": 0.0544, "lr": 0.2851467906005871, "epoch": 0.27923680160261893, "percentage": 14.29, "elapsed_time": "5:57:18", "remaining_time": "1 day, 11:43:30", "throughput": 338.11, "total_tokens": 7248576} {"current_steps": 5720, "total_steps": 40000, "loss": 0.0731, "lr": 0.28512122350961683, "epoch": 0.27948110326631326, "percentage": 14.3, "elapsed_time": "5:57:21", "remaining_time": "1 day, 11:41:38", "throughput": 338.35, "total_tokens": 7254720} {"current_steps": 5725, "total_steps": 40000, "loss": 0.0769, "lr": 0.2850956355812559, "epoch": 0.2797254049300076, "percentage": 14.31, "elapsed_time": "5:57:24", "remaining_time": "1 day, 11:39:45", "throughput": 338.6, "total_tokens": 7261152} {"current_steps": 5730, "total_steps": 40000, "loss": 0.0781, "lr": 0.28507002681945015, "epoch": 0.2799697065937019, "percentage": 14.32, "elapsed_time": "5:57:27", "remaining_time": "1 day, 11:37:53", "throughput": 338.85, "total_tokens": 7267392} {"current_steps": 5735, "total_steps": 40000, "loss": 0.0835, "lr": 0.28504439722814895, "epoch": 0.28021400825739623, "percentage": 14.34, "elapsed_time": "5:57:30", "remaining_time": "1 day, 11:36:02", "throughput": 339.11, "total_tokens": 7274208} {"current_steps": 5740, "total_steps": 40000, "loss": 0.0524, "lr": 0.28501874681130457, "epoch": 0.28045830992109055, "percentage": 14.35, "elapsed_time": "5:57:33", "remaining_time": "1 day, 11:34:09", "throughput": 339.34, "total_tokens": 7280096} {"current_steps": 5745, "total_steps": 40000, "loss": 0.0575, "lr": 0.2849930755728727, "epoch": 0.2807026115847849, "percentage": 14.36, "elapsed_time": "5:57:36", "remaining_time": "1 day, 11:32:18", "throughput": 339.61, "total_tokens": 7286880} {"current_steps": 5750, "total_steps": 40000, "loss": 0.0719, "lr": 0.28496738351681217, "epoch": 0.2809469132484792, "percentage": 14.37, "elapsed_time": "5:57:40", "remaining_time": "1 day, 11:30:27", "throughput": 339.85, "total_tokens": 7293280} {"current_steps": 5755, "total_steps": 40000, "loss": 0.0727, "lr": 0.284941670647085, "epoch": 0.2811912149121735, "percentage": 14.39, "elapsed_time": "5:57:43", "remaining_time": "1 day, 11:28:35", "throughput": 340.08, "total_tokens": 7299232} {"current_steps": 5760, "total_steps": 40000, "loss": 0.0704, "lr": 0.2849159369676563, "epoch": 0.2814355165758679, "percentage": 14.4, "elapsed_time": "5:57:46", "remaining_time": "1 day, 11:26:45", "throughput": 340.35, "total_tokens": 7306048} {"current_steps": 5765, "total_steps": 40000, "loss": 0.0589, "lr": 0.2848901824824948, "epoch": 0.28167981823956223, "percentage": 14.41, "elapsed_time": "5:57:49", "remaining_time": "1 day, 11:24:53", "throughput": 340.59, "total_tokens": 7312224} {"current_steps": 5770, "total_steps": 40000, "loss": 0.0641, "lr": 0.284864407195572, "epoch": 0.28192411990325655, "percentage": 14.42, "elapsed_time": "5:57:52", "remaining_time": "1 day, 11:23:02", "throughput": 340.82, "total_tokens": 7318144} {"current_steps": 5775, "total_steps": 40000, "loss": 0.0445, "lr": 0.28483861111086284, "epoch": 0.2821684215669509, "percentage": 14.44, "elapsed_time": "5:57:55", "remaining_time": "1 day, 11:21:12", "throughput": 341.09, "total_tokens": 7325120} {"current_steps": 5780, "total_steps": 40000, "loss": 0.0858, "lr": 0.2848127942323453, "epoch": 0.2824127232306452, "percentage": 14.45, "elapsed_time": "5:57:58", "remaining_time": "1 day, 11:19:22", "throughput": 341.36, "total_tokens": 7332064} {"current_steps": 5785, "total_steps": 40000, "loss": 0.0831, "lr": 0.2847869565640007, "epoch": 0.2826570248943395, "percentage": 14.46, "elapsed_time": "5:58:01", "remaining_time": "1 day, 11:17:33", "throughput": 341.63, "total_tokens": 7338848} {"current_steps": 5790, "total_steps": 40000, "loss": 0.1067, "lr": 0.2847610981098136, "epoch": 0.28290132655803385, "percentage": 14.47, "elapsed_time": "5:58:04", "remaining_time": "1 day, 11:15:43", "throughput": 341.87, "total_tokens": 7345024} {"current_steps": 5795, "total_steps": 40000, "loss": 0.0957, "lr": 0.2847352188737716, "epoch": 0.2831456282217282, "percentage": 14.49, "elapsed_time": "5:58:08", "remaining_time": "1 day, 11:13:53", "throughput": 342.12, "total_tokens": 7351488} {"current_steps": 5800, "total_steps": 40000, "loss": 0.0944, "lr": 0.2847093188598658, "epoch": 0.2833899298854225, "percentage": 14.5, "elapsed_time": "5:58:11", "remaining_time": "1 day, 11:12:03", "throughput": 342.35, "total_tokens": 7357536} {"current_steps": 5800, "total_steps": 40000, "eval_loss": 0.08094930648803711, "epoch": 0.2833899298854225, "percentage": 14.5, "elapsed_time": "6:08:49", "remaining_time": "1 day, 12:14:50", "throughput": 332.47, "total_tokens": 7357536} {"current_steps": 5805, "total_steps": 40000, "loss": 0.0697, "lr": 0.28468339807209003, "epoch": 0.2836342315491168, "percentage": 14.51, "elapsed_time": "6:08:53", "remaining_time": "1 day, 12:13:00", "throughput": 332.72, "total_tokens": 7364256} {"current_steps": 5810, "total_steps": 40000, "loss": 0.0771, "lr": 0.2846574565144418, "epoch": 0.2838785332128112, "percentage": 14.52, "elapsed_time": "6:08:56", "remaining_time": "1 day, 12:11:07", "throughput": 332.97, "total_tokens": 7370784} {"current_steps": 5815, "total_steps": 40000, "loss": 0.0688, "lr": 0.28463149419092154, "epoch": 0.2841228348765055, "percentage": 14.54, "elapsed_time": "6:08:59", "remaining_time": "1 day, 12:09:14", "throughput": 333.19, "total_tokens": 7376800} {"current_steps": 5820, "total_steps": 40000, "loss": 0.0744, "lr": 0.284605511105533, "epoch": 0.28436713654019985, "percentage": 14.55, "elapsed_time": "6:09:02", "remaining_time": "1 day, 12:07:22", "throughput": 333.43, "total_tokens": 7383072} {"current_steps": 5825, "total_steps": 40000, "loss": 0.0469, "lr": 0.28457950726228315, "epoch": 0.2846114382038942, "percentage": 14.56, "elapsed_time": "6:09:06", "remaining_time": "1 day, 12:05:29", "throughput": 333.67, "total_tokens": 7389504} {"current_steps": 5830, "total_steps": 40000, "loss": 0.0512, "lr": 0.28455348266518193, "epoch": 0.2848557398675885, "percentage": 14.57, "elapsed_time": "6:09:09", "remaining_time": "1 day, 12:03:37", "throughput": 333.91, "total_tokens": 7395840} {"current_steps": 5835, "total_steps": 40000, "loss": 0.0961, "lr": 0.28452743731824287, "epoch": 0.2851000415312828, "percentage": 14.59, "elapsed_time": "6:09:12", "remaining_time": "1 day, 12:01:45", "throughput": 334.16, "total_tokens": 7402304} {"current_steps": 5840, "total_steps": 40000, "loss": 0.0466, "lr": 0.28450137122548236, "epoch": 0.28534434319497715, "percentage": 14.6, "elapsed_time": "6:09:15", "remaining_time": "1 day, 11:59:53", "throughput": 334.41, "total_tokens": 7408928} {"current_steps": 5845, "total_steps": 40000, "loss": 0.0544, "lr": 0.2844752843909201, "epoch": 0.28558864485867147, "percentage": 14.61, "elapsed_time": "6:09:18", "remaining_time": "1 day, 11:58:00", "throughput": 334.64, "total_tokens": 7415072} {"current_steps": 5850, "total_steps": 40000, "loss": 0.091, "lr": 0.28444917681857923, "epoch": 0.2858329465223658, "percentage": 14.62, "elapsed_time": "6:09:21", "remaining_time": "1 day, 11:56:08", "throughput": 334.86, "total_tokens": 7420960} {"current_steps": 5855, "total_steps": 40000, "loss": 0.0619, "lr": 0.28442304851248557, "epoch": 0.2860772481860602, "percentage": 14.64, "elapsed_time": "6:09:24", "remaining_time": "1 day, 11:54:16", "throughput": 335.08, "total_tokens": 7426848} {"current_steps": 5860, "total_steps": 40000, "loss": 0.0779, "lr": 0.2843968994766686, "epoch": 0.2863215498497545, "percentage": 14.65, "elapsed_time": "6:09:27", "remaining_time": "1 day, 11:52:26", "throughput": 335.34, "total_tokens": 7433728} {"current_steps": 5865, "total_steps": 40000, "loss": 0.0987, "lr": 0.28437072971516075, "epoch": 0.2865658515134488, "percentage": 14.66, "elapsed_time": "6:09:30", "remaining_time": "1 day, 11:50:35", "throughput": 335.59, "total_tokens": 7440224} {"current_steps": 5870, "total_steps": 40000, "loss": 0.1005, "lr": 0.2843445392319979, "epoch": 0.28681015317714315, "percentage": 14.67, "elapsed_time": "6:09:33", "remaining_time": "1 day, 11:48:44", "throughput": 335.82, "total_tokens": 7446368} {"current_steps": 5875, "total_steps": 40000, "loss": 0.0698, "lr": 0.28431832803121865, "epoch": 0.28705445484083747, "percentage": 14.69, "elapsed_time": "6:09:36", "remaining_time": "1 day, 11:46:53", "throughput": 336.07, "total_tokens": 7453024} {"current_steps": 5880, "total_steps": 40000, "loss": 0.0781, "lr": 0.28429209611686534, "epoch": 0.2872987565045318, "percentage": 14.7, "elapsed_time": "6:09:39", "remaining_time": "1 day, 11:45:03", "throughput": 336.31, "total_tokens": 7459360} {"current_steps": 5885, "total_steps": 40000, "loss": 0.0636, "lr": 0.28426584349298323, "epoch": 0.2875430581682261, "percentage": 14.71, "elapsed_time": "6:09:42", "remaining_time": "1 day, 11:43:12", "throughput": 336.54, "total_tokens": 7465472} {"current_steps": 5890, "total_steps": 40000, "loss": 0.0708, "lr": 0.2842395701636207, "epoch": 0.28778735983192044, "percentage": 14.72, "elapsed_time": "6:09:45", "remaining_time": "1 day, 11:41:22", "throughput": 336.79, "total_tokens": 7471904} {"current_steps": 5895, "total_steps": 40000, "loss": 0.0611, "lr": 0.28421327613282954, "epoch": 0.28803166149561477, "percentage": 14.74, "elapsed_time": "6:09:49", "remaining_time": "1 day, 11:39:32", "throughput": 337.04, "total_tokens": 7478528} {"current_steps": 5900, "total_steps": 40000, "loss": 0.0342, "lr": 0.28418696140466454, "epoch": 0.2882759631593091, "percentage": 14.75, "elapsed_time": "6:09:52", "remaining_time": "1 day, 11:37:42", "throughput": 337.26, "total_tokens": 7484544} {"current_steps": 5905, "total_steps": 40000, "loss": 0.098, "lr": 0.2841606259831838, "epoch": 0.28852026482300347, "percentage": 14.76, "elapsed_time": "6:09:55", "remaining_time": "1 day, 11:35:53", "throughput": 337.51, "total_tokens": 7491072} {"current_steps": 5910, "total_steps": 40000, "loss": 0.0732, "lr": 0.2841342698724486, "epoch": 0.2887645664866978, "percentage": 14.77, "elapsed_time": "6:09:58", "remaining_time": "1 day, 11:34:03", "throughput": 337.74, "total_tokens": 7497312} {"current_steps": 5915, "total_steps": 40000, "loss": 0.0686, "lr": 0.28410789307652334, "epoch": 0.2890088681503921, "percentage": 14.79, "elapsed_time": "6:10:01", "remaining_time": "1 day, 11:32:15", "throughput": 338.0, "total_tokens": 7504128} {"current_steps": 5920, "total_steps": 40000, "loss": 0.0923, "lr": 0.2840814955994756, "epoch": 0.28925316981408644, "percentage": 14.8, "elapsed_time": "6:10:04", "remaining_time": "1 day, 11:30:26", "throughput": 338.24, "total_tokens": 7510496} {"current_steps": 5925, "total_steps": 40000, "loss": 0.0861, "lr": 0.2840550774453763, "epoch": 0.28949747147778077, "percentage": 14.81, "elapsed_time": "6:10:07", "remaining_time": "1 day, 11:28:36", "throughput": 338.47, "total_tokens": 7516640} {"current_steps": 5930, "total_steps": 40000, "loss": 0.071, "lr": 0.28402863861829947, "epoch": 0.2897417731414751, "percentage": 14.82, "elapsed_time": "6:10:10", "remaining_time": "1 day, 11:26:48", "throughput": 338.71, "total_tokens": 7522912} {"current_steps": 5935, "total_steps": 40000, "loss": 0.0557, "lr": 0.2840021791223222, "epoch": 0.2899860748051694, "percentage": 14.84, "elapsed_time": "6:10:13", "remaining_time": "1 day, 11:24:59", "throughput": 338.93, "total_tokens": 7528832} {"current_steps": 5940, "total_steps": 40000, "loss": 0.0604, "lr": 0.2839756989615249, "epoch": 0.29023037646886374, "percentage": 14.85, "elapsed_time": "6:10:16", "remaining_time": "1 day, 11:23:11", "throughput": 339.18, "total_tokens": 7535488} {"current_steps": 5945, "total_steps": 40000, "loss": 0.0699, "lr": 0.28394919813999125, "epoch": 0.29047467813255806, "percentage": 14.86, "elapsed_time": "6:10:19", "remaining_time": "1 day, 11:21:22", "throughput": 339.41, "total_tokens": 7541696} {"current_steps": 5950, "total_steps": 40000, "loss": 0.0824, "lr": 0.28392267666180787, "epoch": 0.2907189797962524, "percentage": 14.88, "elapsed_time": "6:10:23", "remaining_time": "1 day, 11:19:35", "throughput": 339.66, "total_tokens": 7548352} {"current_steps": 5955, "total_steps": 40000, "loss": 0.0631, "lr": 0.2838961345310648, "epoch": 0.29096328145994677, "percentage": 14.89, "elapsed_time": "6:10:26", "remaining_time": "1 day, 11:17:47", "throughput": 339.88, "total_tokens": 7554144} {"current_steps": 5960, "total_steps": 40000, "loss": 0.0679, "lr": 0.2838695717518552, "epoch": 0.2912075831236411, "percentage": 14.9, "elapsed_time": "6:10:29", "remaining_time": "1 day, 11:15:59", "throughput": 340.12, "total_tokens": 7560640} {"current_steps": 5965, "total_steps": 40000, "loss": 0.0773, "lr": 0.28384298832827526, "epoch": 0.2914518847873354, "percentage": 14.91, "elapsed_time": "6:10:32", "remaining_time": "1 day, 11:14:11", "throughput": 340.35, "total_tokens": 7566720} {"current_steps": 5970, "total_steps": 40000, "loss": 0.0675, "lr": 0.28381638426442457, "epoch": 0.29169618645102974, "percentage": 14.92, "elapsed_time": "6:10:35", "remaining_time": "1 day, 11:12:24", "throughput": 340.59, "total_tokens": 7573120} {"current_steps": 5975, "total_steps": 40000, "loss": 0.0912, "lr": 0.2837897595644057, "epoch": 0.29194048811472406, "percentage": 14.94, "elapsed_time": "6:10:38", "remaining_time": "1 day, 11:10:36", "throughput": 340.81, "total_tokens": 7578976} {"current_steps": 5980, "total_steps": 40000, "loss": 0.0769, "lr": 0.28376311423232475, "epoch": 0.2921847897784184, "percentage": 14.95, "elapsed_time": "6:10:41", "remaining_time": "1 day, 11:08:48", "throughput": 341.04, "total_tokens": 7585184} {"current_steps": 5985, "total_steps": 40000, "loss": 0.0922, "lr": 0.2837364482722905, "epoch": 0.2924290914421127, "percentage": 14.96, "elapsed_time": "6:10:44", "remaining_time": "1 day, 11:07:02", "throughput": 341.3, "total_tokens": 7591872} {"current_steps": 5990, "total_steps": 40000, "loss": 0.0988, "lr": 0.28370976168841533, "epoch": 0.29267339310580703, "percentage": 14.97, "elapsed_time": "6:10:47", "remaining_time": "1 day, 11:05:15", "throughput": 341.52, "total_tokens": 7597824} {"current_steps": 5995, "total_steps": 40000, "loss": 0.0919, "lr": 0.2836830544848146, "epoch": 0.29291769476950136, "percentage": 14.99, "elapsed_time": "6:10:50", "remaining_time": "1 day, 11:03:28", "throughput": 341.74, "total_tokens": 7603776} {"current_steps": 6000, "total_steps": 40000, "loss": 0.056, "lr": 0.2836563266656069, "epoch": 0.29316199643319574, "percentage": 15.0, "elapsed_time": "6:10:53", "remaining_time": "1 day, 11:01:42", "throughput": 341.98, "total_tokens": 7610208} {"current_steps": 6000, "total_steps": 40000, "eval_loss": 0.08778867870569229, "epoch": 0.29316199643319574, "percentage": 15.0, "elapsed_time": "6:21:32", "remaining_time": "1 day, 12:02:05", "throughput": 332.43, "total_tokens": 7610208} {"current_steps": 6005, "total_steps": 40000, "loss": 0.0497, "lr": 0.283629578234914, "epoch": 0.29340629809689006, "percentage": 15.01, "elapsed_time": "6:21:36", "remaining_time": "1 day, 12:00:20", "throughput": 332.67, "total_tokens": 7616992} {"current_steps": 6010, "total_steps": 40000, "loss": 0.1217, "lr": 0.2836028091968608, "epoch": 0.2936505997605844, "percentage": 15.02, "elapsed_time": "6:21:39", "remaining_time": "1 day, 11:58:31", "throughput": 332.91, "total_tokens": 7623616} {"current_steps": 6015, "total_steps": 40000, "loss": 0.0698, "lr": 0.28357601955557554, "epoch": 0.2938949014242787, "percentage": 15.04, "elapsed_time": "6:21:43", "remaining_time": "1 day, 11:56:43", "throughput": 333.15, "total_tokens": 7630240} {"current_steps": 6020, "total_steps": 40000, "loss": 0.0637, "lr": 0.2835492093151894, "epoch": 0.29413920308797303, "percentage": 15.05, "elapsed_time": "6:21:46", "remaining_time": "1 day, 11:54:54", "throughput": 333.39, "total_tokens": 7636768} {"current_steps": 6025, "total_steps": 40000, "loss": 0.0975, "lr": 0.2835223784798369, "epoch": 0.29438350475166736, "percentage": 15.06, "elapsed_time": "6:21:49", "remaining_time": "1 day, 11:53:05", "throughput": 333.64, "total_tokens": 7643488} {"current_steps": 6030, "total_steps": 40000, "loss": 0.0521, "lr": 0.2834955270536557, "epoch": 0.2946278064153617, "percentage": 15.07, "elapsed_time": "6:21:52", "remaining_time": "1 day, 11:51:17", "throughput": 333.88, "total_tokens": 7650080} {"current_steps": 6035, "total_steps": 40000, "loss": 0.065, "lr": 0.2834686550407866, "epoch": 0.294872108079056, "percentage": 15.09, "elapsed_time": "6:21:55", "remaining_time": "1 day, 11:49:28", "throughput": 334.12, "total_tokens": 7656544} {"current_steps": 6040, "total_steps": 40000, "loss": 0.083, "lr": 0.28344176244537367, "epoch": 0.29511640974275033, "percentage": 15.1, "elapsed_time": "6:21:58", "remaining_time": "1 day, 11:47:41", "throughput": 334.37, "total_tokens": 7663392} {"current_steps": 6045, "total_steps": 40000, "loss": 0.0695, "lr": 0.28341484927156396, "epoch": 0.29536071140644465, "percentage": 15.11, "elapsed_time": "6:22:01", "remaining_time": "1 day, 11:45:52", "throughput": 334.59, "total_tokens": 7669376} {"current_steps": 6050, "total_steps": 40000, "loss": 0.0728, "lr": 0.28338791552350795, "epoch": 0.29560501307013903, "percentage": 15.12, "elapsed_time": "6:22:05", "remaining_time": "1 day, 11:44:05", "throughput": 334.85, "total_tokens": 7676352} {"current_steps": 6055, "total_steps": 40000, "loss": 0.0827, "lr": 0.28336096120535914, "epoch": 0.29584931473383336, "percentage": 15.14, "elapsed_time": "6:22:08", "remaining_time": "1 day, 11:42:17", "throughput": 335.07, "total_tokens": 7682560} {"current_steps": 6060, "total_steps": 40000, "loss": 0.0869, "lr": 0.2833339863212741, "epoch": 0.2960936163975277, "percentage": 15.15, "elapsed_time": "6:22:11", "remaining_time": "1 day, 11:40:29", "throughput": 335.3, "total_tokens": 7688864} {"current_steps": 6065, "total_steps": 40000, "loss": 0.0697, "lr": 0.28330699087541283, "epoch": 0.296337918061222, "percentage": 15.16, "elapsed_time": "6:22:14", "remaining_time": "1 day, 11:38:41", "throughput": 335.53, "total_tokens": 7695008} {"current_steps": 6070, "total_steps": 40000, "loss": 0.0572, "lr": 0.2832799748719384, "epoch": 0.29658221972491633, "percentage": 15.17, "elapsed_time": "6:22:17", "remaining_time": "1 day, 11:36:54", "throughput": 335.76, "total_tokens": 7701504} {"current_steps": 6075, "total_steps": 40000, "loss": 0.0794, "lr": 0.28325293831501686, "epoch": 0.29682652138861065, "percentage": 15.19, "elapsed_time": "6:22:20", "remaining_time": "1 day, 11:35:08", "throughput": 336.0, "total_tokens": 7708128} {"current_steps": 6080, "total_steps": 40000, "loss": 0.0397, "lr": 0.2832258812088177, "epoch": 0.297070823052305, "percentage": 15.2, "elapsed_time": "6:22:23", "remaining_time": "1 day, 11:33:20", "throughput": 336.22, "total_tokens": 7714080} {"current_steps": 6085, "total_steps": 40000, "loss": 0.0754, "lr": 0.2831988035575134, "epoch": 0.2973151247159993, "percentage": 15.21, "elapsed_time": "6:22:26", "remaining_time": "1 day, 11:31:34", "throughput": 336.46, "total_tokens": 7720544} {"current_steps": 6090, "total_steps": 40000, "loss": 0.0532, "lr": 0.28317170536527975, "epoch": 0.2975594263796936, "percentage": 15.22, "elapsed_time": "6:22:29", "remaining_time": "1 day, 11:29:47", "throughput": 336.69, "total_tokens": 7726944} {"current_steps": 6095, "total_steps": 40000, "loss": 0.0498, "lr": 0.2831445866362956, "epoch": 0.29780372804338795, "percentage": 15.24, "elapsed_time": "6:22:32", "remaining_time": "1 day, 11:28:00", "throughput": 336.91, "total_tokens": 7732992} {"current_steps": 6100, "total_steps": 40000, "loss": 0.088, "lr": 0.2831174473747429, "epoch": 0.29804802970708233, "percentage": 15.25, "elapsed_time": "6:22:35", "remaining_time": "1 day, 11:26:14", "throughput": 337.15, "total_tokens": 7739520} {"current_steps": 6105, "total_steps": 40000, "loss": 0.0829, "lr": 0.2830902875848071, "epoch": 0.29829233137077665, "percentage": 15.26, "elapsed_time": "6:22:39", "remaining_time": "1 day, 11:24:28", "throughput": 337.39, "total_tokens": 7746080} {"current_steps": 6110, "total_steps": 40000, "loss": 0.0532, "lr": 0.28306310727067635, "epoch": 0.298536633034471, "percentage": 15.28, "elapsed_time": "6:22:42", "remaining_time": "1 day, 11:22:43", "throughput": 337.63, "total_tokens": 7752736} {"current_steps": 6115, "total_steps": 40000, "loss": 0.0874, "lr": 0.2830359064365423, "epoch": 0.2987809346981653, "percentage": 15.29, "elapsed_time": "6:22:45", "remaining_time": "1 day, 11:20:57", "throughput": 337.86, "total_tokens": 7759168} {"current_steps": 6120, "total_steps": 40000, "loss": 0.0532, "lr": 0.28300868508659965, "epoch": 0.2990252363618596, "percentage": 15.3, "elapsed_time": "6:22:48", "remaining_time": "1 day, 11:19:11", "throughput": 338.1, "total_tokens": 7765504} {"current_steps": 6125, "total_steps": 40000, "loss": 0.0513, "lr": 0.28298144322504626, "epoch": 0.29926953802555395, "percentage": 15.31, "elapsed_time": "6:22:51", "remaining_time": "1 day, 11:17:26", "throughput": 338.33, "total_tokens": 7772032} {"current_steps": 6130, "total_steps": 40000, "loss": 0.0548, "lr": 0.2829541808560832, "epoch": 0.2995138396892483, "percentage": 15.32, "elapsed_time": "6:22:54", "remaining_time": "1 day, 11:15:41", "throughput": 338.57, "total_tokens": 7778496} {"current_steps": 6135, "total_steps": 40000, "loss": 0.0466, "lr": 0.2829268979839146, "epoch": 0.2997581413529426, "percentage": 15.34, "elapsed_time": "6:22:57", "remaining_time": "1 day, 11:13:56", "throughput": 338.81, "total_tokens": 7785184} {"current_steps": 6140, "total_steps": 40000, "loss": 0.0591, "lr": 0.2828995946127479, "epoch": 0.3000024430166369, "percentage": 15.35, "elapsed_time": "6:23:00", "remaining_time": "1 day, 11:12:11", "throughput": 339.03, "total_tokens": 7791296} {"current_steps": 6145, "total_steps": 40000, "loss": 0.0574, "lr": 0.2828722707467936, "epoch": 0.30024674468033125, "percentage": 15.36, "elapsed_time": "6:23:03", "remaining_time": "1 day, 11:10:26", "throughput": 339.26, "total_tokens": 7797440} {"current_steps": 6150, "total_steps": 40000, "loss": 0.0624, "lr": 0.2828449263902653, "epoch": 0.3004910463440256, "percentage": 15.38, "elapsed_time": "6:23:07", "remaining_time": "1 day, 11:08:42", "throughput": 339.49, "total_tokens": 7803904} {"current_steps": 6155, "total_steps": 40000, "loss": 0.0584, "lr": 0.28281756154738, "epoch": 0.30073534800771995, "percentage": 15.39, "elapsed_time": "6:23:10", "remaining_time": "1 day, 11:06:57", "throughput": 339.71, "total_tokens": 7810048} {"current_steps": 6160, "total_steps": 40000, "loss": 0.0687, "lr": 0.28279017622235764, "epoch": 0.3009796496714143, "percentage": 15.4, "elapsed_time": "6:23:13", "remaining_time": "1 day, 11:05:14", "throughput": 339.99, "total_tokens": 7817568} {"current_steps": 6165, "total_steps": 40000, "loss": 0.0943, "lr": 0.28276277041942127, "epoch": 0.3012239513351086, "percentage": 15.41, "elapsed_time": "6:23:16", "remaining_time": "1 day, 11:03:30", "throughput": 340.24, "total_tokens": 7824288} {"current_steps": 6170, "total_steps": 40000, "loss": 0.0796, "lr": 0.2827353441427974, "epoch": 0.3014682529988029, "percentage": 15.43, "elapsed_time": "6:23:19", "remaining_time": "1 day, 11:01:47", "throughput": 340.47, "total_tokens": 7830752} {"current_steps": 6175, "total_steps": 40000, "loss": 0.0762, "lr": 0.2827078973967153, "epoch": 0.30171255466249725, "percentage": 15.44, "elapsed_time": "6:23:22", "remaining_time": "1 day, 11:00:03", "throughput": 340.71, "total_tokens": 7837408} {"current_steps": 6180, "total_steps": 40000, "loss": 0.0911, "lr": 0.2826804301854078, "epoch": 0.30195685632619157, "percentage": 15.45, "elapsed_time": "6:23:26", "remaining_time": "1 day, 10:58:20", "throughput": 340.94, "total_tokens": 7843776} {"current_steps": 6185, "total_steps": 40000, "loss": 0.0846, "lr": 0.2826529425131105, "epoch": 0.3022011579898859, "percentage": 15.46, "elapsed_time": "6:23:29", "remaining_time": "1 day, 10:56:37", "throughput": 341.19, "total_tokens": 7850432} {"current_steps": 6190, "total_steps": 40000, "loss": 0.0907, "lr": 0.2826254343840625, "epoch": 0.3024454596535802, "percentage": 15.47, "elapsed_time": "6:23:32", "remaining_time": "1 day, 10:54:53", "throughput": 341.4, "total_tokens": 7856384} {"current_steps": 6195, "total_steps": 40000, "loss": 0.0622, "lr": 0.2825979058025059, "epoch": 0.3026897613172746, "percentage": 15.49, "elapsed_time": "6:23:35", "remaining_time": "1 day, 10:53:10", "throughput": 341.62, "total_tokens": 7862560} {"current_steps": 6200, "total_steps": 40000, "loss": 0.0573, "lr": 0.2825703567726858, "epoch": 0.3029340629809689, "percentage": 15.5, "elapsed_time": "6:23:38", "remaining_time": "1 day, 10:51:26", "throughput": 341.85, "total_tokens": 7868832} {"current_steps": 6200, "total_steps": 40000, "eval_loss": 0.08069460093975067, "epoch": 0.3029340629809689, "percentage": 15.5, "elapsed_time": "6:34:16", "remaining_time": "1 day, 11:49:28", "throughput": 332.62, "total_tokens": 7868832} {"current_steps": 6205, "total_steps": 40000, "loss": 0.0524, "lr": 0.2825427872988508, "epoch": 0.30317836464466325, "percentage": 15.51, "elapsed_time": "6:34:20", "remaining_time": "1 day, 11:47:45", "throughput": 332.83, "total_tokens": 7875072} {"current_steps": 6210, "total_steps": 40000, "loss": 0.0699, "lr": 0.28251519738525227, "epoch": 0.30342266630835757, "percentage": 15.53, "elapsed_time": "6:34:23", "remaining_time": "1 day, 11:45:59", "throughput": 333.04, "total_tokens": 7880992} {"current_steps": 6215, "total_steps": 40000, "loss": 0.079, "lr": 0.28248758703614507, "epoch": 0.3036669679720519, "percentage": 15.54, "elapsed_time": "6:34:26", "remaining_time": "1 day, 11:44:13", "throughput": 333.27, "total_tokens": 7887392} {"current_steps": 6220, "total_steps": 40000, "loss": 0.0726, "lr": 0.28245995625578696, "epoch": 0.3039112696357462, "percentage": 15.55, "elapsed_time": "6:34:29", "remaining_time": "1 day, 11:42:28", "throughput": 333.5, "total_tokens": 7894016} {"current_steps": 6225, "total_steps": 40000, "loss": 0.0728, "lr": 0.282432305048439, "epoch": 0.30415557129944054, "percentage": 15.56, "elapsed_time": "6:34:33", "remaining_time": "1 day, 11:40:42", "throughput": 333.72, "total_tokens": 7900224} {"current_steps": 6230, "total_steps": 40000, "loss": 0.0503, "lr": 0.28240463341836536, "epoch": 0.30439987296313487, "percentage": 15.57, "elapsed_time": "6:34:36", "remaining_time": "1 day, 11:38:57", "throughput": 333.94, "total_tokens": 7906464} {"current_steps": 6235, "total_steps": 40000, "loss": 0.0759, "lr": 0.2823769413698334, "epoch": 0.3046441746268292, "percentage": 15.59, "elapsed_time": "6:34:39", "remaining_time": "1 day, 11:37:11", "throughput": 334.15, "total_tokens": 7912352} {"current_steps": 6240, "total_steps": 40000, "loss": 0.0594, "lr": 0.2823492289071135, "epoch": 0.3048884762905235, "percentage": 15.6, "elapsed_time": "6:34:42", "remaining_time": "1 day, 11:35:26", "throughput": 334.38, "total_tokens": 7918944} {"current_steps": 6245, "total_steps": 40000, "loss": 0.0529, "lr": 0.2823214960344793, "epoch": 0.3051327779542179, "percentage": 15.61, "elapsed_time": "6:34:45", "remaining_time": "1 day, 11:33:41", "throughput": 334.6, "total_tokens": 7925024} {"current_steps": 6250, "total_steps": 40000, "loss": 0.0603, "lr": 0.28229374275620756, "epoch": 0.3053770796179122, "percentage": 15.62, "elapsed_time": "6:34:48", "remaining_time": "1 day, 11:31:56", "throughput": 334.82, "total_tokens": 7931232} {"current_steps": 6255, "total_steps": 40000, "loss": 0.0543, "lr": 0.28226596907657814, "epoch": 0.30562138128160654, "percentage": 15.64, "elapsed_time": "6:34:51", "remaining_time": "1 day, 11:30:11", "throughput": 335.04, "total_tokens": 7937536} {"current_steps": 6260, "total_steps": 40000, "loss": 0.0405, "lr": 0.28223817499987414, "epoch": 0.30586568294530087, "percentage": 15.65, "elapsed_time": "6:34:54", "remaining_time": "1 day, 11:28:27", "throughput": 335.26, "total_tokens": 7943648} {"current_steps": 6265, "total_steps": 40000, "loss": 0.0866, "lr": 0.2822103605303818, "epoch": 0.3061099846089952, "percentage": 15.66, "elapsed_time": "6:34:57", "remaining_time": "1 day, 11:26:42", "throughput": 335.48, "total_tokens": 7949952} {"current_steps": 6270, "total_steps": 40000, "loss": 0.0738, "lr": 0.2821825256723903, "epoch": 0.3063542862726895, "percentage": 15.68, "elapsed_time": "6:35:00", "remaining_time": "1 day, 11:24:59", "throughput": 335.72, "total_tokens": 7956672} {"current_steps": 6275, "total_steps": 40000, "loss": 0.0874, "lr": 0.2821546704301923, "epoch": 0.30659858793638384, "percentage": 15.69, "elapsed_time": "6:35:03", "remaining_time": "1 day, 11:23:15", "throughput": 335.93, "total_tokens": 7962752} {"current_steps": 6280, "total_steps": 40000, "loss": 0.0917, "lr": 0.2821267948080834, "epoch": 0.30684288960007816, "percentage": 15.7, "elapsed_time": "6:35:06", "remaining_time": "1 day, 11:21:31", "throughput": 336.15, "total_tokens": 7968992} {"current_steps": 6285, "total_steps": 40000, "loss": 0.081, "lr": 0.28209889881036226, "epoch": 0.3070871912637725, "percentage": 15.71, "elapsed_time": "6:35:09", "remaining_time": "1 day, 11:19:47", "throughput": 336.38, "total_tokens": 7975456} {"current_steps": 6290, "total_steps": 40000, "loss": 0.0762, "lr": 0.28207098244133094, "epoch": 0.3073314929274668, "percentage": 15.72, "elapsed_time": "6:35:12", "remaining_time": "1 day, 11:18:04", "throughput": 336.63, "total_tokens": 7982400} {"current_steps": 6295, "total_steps": 40000, "loss": 0.0684, "lr": 0.2820430457052943, "epoch": 0.3075757945911612, "percentage": 15.74, "elapsed_time": "6:35:16", "remaining_time": "1 day, 11:16:21", "throughput": 336.85, "total_tokens": 7988832} {"current_steps": 6300, "total_steps": 40000, "loss": 0.0543, "lr": 0.28201508860656077, "epoch": 0.3078200962548555, "percentage": 15.75, "elapsed_time": "6:35:19", "remaining_time": "1 day, 11:14:39", "throughput": 337.09, "total_tokens": 7995456} {"current_steps": 6305, "total_steps": 40000, "loss": 0.0851, "lr": 0.2819871111494415, "epoch": 0.30806439791854984, "percentage": 15.76, "elapsed_time": "6:35:22", "remaining_time": "1 day, 11:12:55", "throughput": 337.32, "total_tokens": 8001920} {"current_steps": 6310, "total_steps": 40000, "loss": 0.0835, "lr": 0.28195911333825113, "epoch": 0.30830869958224416, "percentage": 15.78, "elapsed_time": "6:35:25", "remaining_time": "1 day, 11:11:13", "throughput": 337.55, "total_tokens": 8008384} {"current_steps": 6315, "total_steps": 40000, "loss": 0.0774, "lr": 0.28193109517730713, "epoch": 0.3085530012459385, "percentage": 15.79, "elapsed_time": "6:35:28", "remaining_time": "1 day, 11:09:30", "throughput": 337.77, "total_tokens": 8014752} {"current_steps": 6320, "total_steps": 40000, "loss": 0.0895, "lr": 0.2819030566709303, "epoch": 0.3087973029096328, "percentage": 15.8, "elapsed_time": "6:35:31", "remaining_time": "1 day, 11:07:47", "throughput": 337.99, "total_tokens": 8020928} {"current_steps": 6325, "total_steps": 40000, "loss": 0.0837, "lr": 0.2818749978234445, "epoch": 0.30904160457332713, "percentage": 15.81, "elapsed_time": "6:35:34", "remaining_time": "1 day, 11:06:05", "throughput": 338.2, "total_tokens": 8027104} {"current_steps": 6330, "total_steps": 40000, "loss": 0.0668, "lr": 0.2818469186391768, "epoch": 0.30928590623702146, "percentage": 15.82, "elapsed_time": "6:35:37", "remaining_time": "1 day, 11:04:23", "throughput": 338.43, "total_tokens": 8033600} {"current_steps": 6335, "total_steps": 40000, "loss": 0.0837, "lr": 0.28181881912245743, "epoch": 0.3095302079007158, "percentage": 15.84, "elapsed_time": "6:35:40", "remaining_time": "1 day, 11:02:41", "throughput": 338.65, "total_tokens": 8039680} {"current_steps": 6340, "total_steps": 40000, "loss": 0.0691, "lr": 0.2817906992776195, "epoch": 0.30977450956441016, "percentage": 15.85, "elapsed_time": "6:35:43", "remaining_time": "1 day, 11:00:59", "throughput": 338.87, "total_tokens": 8045984} {"current_steps": 6345, "total_steps": 40000, "loss": 0.0957, "lr": 0.28176255910899967, "epoch": 0.3100188112281045, "percentage": 15.86, "elapsed_time": "6:35:46", "remaining_time": "1 day, 10:59:17", "throughput": 339.1, "total_tokens": 8052640} {"current_steps": 6350, "total_steps": 40000, "loss": 0.0875, "lr": 0.2817343986209373, "epoch": 0.3102631128917988, "percentage": 15.88, "elapsed_time": "6:35:49", "remaining_time": "1 day, 10:57:35", "throughput": 339.31, "total_tokens": 8058592} {"current_steps": 6355, "total_steps": 40000, "loss": 0.0944, "lr": 0.2817062178177753, "epoch": 0.31050741455549313, "percentage": 15.89, "elapsed_time": "6:35:52", "remaining_time": "1 day, 10:55:53", "throughput": 339.51, "total_tokens": 8064448} {"current_steps": 6360, "total_steps": 40000, "loss": 0.1311, "lr": 0.2816780167038593, "epoch": 0.31075171621918746, "percentage": 15.9, "elapsed_time": "6:35:55", "remaining_time": "1 day, 10:54:11", "throughput": 339.72, "total_tokens": 8070400} {"current_steps": 6365, "total_steps": 40000, "loss": 0.0795, "lr": 0.28164979528353834, "epoch": 0.3109960178828818, "percentage": 15.91, "elapsed_time": "6:35:58", "remaining_time": "1 day, 10:52:31", "throughput": 339.95, "total_tokens": 8076768} {"current_steps": 6370, "total_steps": 40000, "loss": 0.082, "lr": 0.28162155356116453, "epoch": 0.3112403195465761, "percentage": 15.93, "elapsed_time": "6:36:02", "remaining_time": "1 day, 10:50:50", "throughput": 340.19, "total_tokens": 8083648} {"current_steps": 6375, "total_steps": 40000, "loss": 0.057, "lr": 0.28159329154109314, "epoch": 0.31148462121027043, "percentage": 15.94, "elapsed_time": "6:36:05", "remaining_time": "1 day, 10:49:11", "throughput": 340.44, "total_tokens": 8090656} {"current_steps": 6380, "total_steps": 40000, "loss": 0.0706, "lr": 0.28156500922768246, "epoch": 0.31172892287396475, "percentage": 15.95, "elapsed_time": "6:36:08", "remaining_time": "1 day, 10:47:29", "throughput": 340.64, "total_tokens": 8096544} {"current_steps": 6385, "total_steps": 40000, "loss": 0.0875, "lr": 0.28153670662529406, "epoch": 0.3119732245376591, "percentage": 15.96, "elapsed_time": "6:36:11", "remaining_time": "1 day, 10:45:49", "throughput": 340.86, "total_tokens": 8102720} {"current_steps": 6390, "total_steps": 40000, "loss": 0.0539, "lr": 0.28150838373829246, "epoch": 0.31221752620135346, "percentage": 15.97, "elapsed_time": "6:36:14", "remaining_time": "1 day, 10:44:08", "throughput": 341.08, "total_tokens": 8108992} {"current_steps": 6395, "total_steps": 40000, "loss": 0.0803, "lr": 0.2814800405710455, "epoch": 0.3124618278650478, "percentage": 15.99, "elapsed_time": "6:36:17", "remaining_time": "1 day, 10:42:28", "throughput": 341.3, "total_tokens": 8115200} {"current_steps": 6400, "total_steps": 40000, "loss": 0.0703, "lr": 0.2814516771279239, "epoch": 0.3127061295287421, "percentage": 16.0, "elapsed_time": "6:36:20", "remaining_time": "1 day, 10:40:48", "throughput": 341.53, "total_tokens": 8121856} {"current_steps": 6400, "total_steps": 40000, "eval_loss": 0.0833856537938118, "epoch": 0.3127061295287421, "percentage": 16.0, "elapsed_time": "6:46:59", "remaining_time": "1 day, 11:36:43", "throughput": 332.6, "total_tokens": 8121856} {"current_steps": 6405, "total_steps": 40000, "loss": 0.0982, "lr": 0.28142329341330186, "epoch": 0.31295043119243643, "percentage": 16.01, "elapsed_time": "6:47:03", "remaining_time": "1 day, 11:35:04", "throughput": 332.79, "total_tokens": 8127840} {"current_steps": 6410, "total_steps": 40000, "loss": 0.0926, "lr": 0.2813948894315564, "epoch": 0.31319473285613075, "percentage": 16.02, "elapsed_time": "6:47:06", "remaining_time": "1 day, 11:33:21", "throughput": 333.01, "total_tokens": 8134400} {"current_steps": 6415, "total_steps": 40000, "loss": 0.086, "lr": 0.2813664651870677, "epoch": 0.3134390345198251, "percentage": 16.04, "elapsed_time": "6:47:09", "remaining_time": "1 day, 11:31:39", "throughput": 333.25, "total_tokens": 8141120} {"current_steps": 6420, "total_steps": 40000, "loss": 0.0673, "lr": 0.28133802068421926, "epoch": 0.3136833361835194, "percentage": 16.05, "elapsed_time": "6:47:12", "remaining_time": "1 day, 11:29:56", "throughput": 333.46, "total_tokens": 8147328} {"current_steps": 6425, "total_steps": 40000, "loss": 0.0647, "lr": 0.28130955592739754, "epoch": 0.3139276378472137, "percentage": 16.06, "elapsed_time": "6:47:15", "remaining_time": "1 day, 11:28:14", "throughput": 333.67, "total_tokens": 8153408} {"current_steps": 6430, "total_steps": 40000, "loss": 0.0597, "lr": 0.2812810709209922, "epoch": 0.31417193951090805, "percentage": 16.07, "elapsed_time": "6:47:18", "remaining_time": "1 day, 11:26:31", "throughput": 333.87, "total_tokens": 8159392} {"current_steps": 6435, "total_steps": 40000, "loss": 0.0808, "lr": 0.2812525656693959, "epoch": 0.3144162411746024, "percentage": 16.09, "elapsed_time": "6:47:22", "remaining_time": "1 day, 11:24:49", "throughput": 334.1, "total_tokens": 8166080} {"current_steps": 6440, "total_steps": 40000, "loss": 0.1068, "lr": 0.28122404017700453, "epoch": 0.31466054283829675, "percentage": 16.1, "elapsed_time": "6:47:25", "remaining_time": "1 day, 11:23:07", "throughput": 334.31, "total_tokens": 8172256} {"current_steps": 6445, "total_steps": 40000, "loss": 0.0762, "lr": 0.2811954944482171, "epoch": 0.3149048445019911, "percentage": 16.11, "elapsed_time": "6:47:28", "remaining_time": "1 day, 11:21:26", "throughput": 334.54, "total_tokens": 8178848} {"current_steps": 6450, "total_steps": 40000, "loss": 0.0739, "lr": 0.2811669284874358, "epoch": 0.3151491461656854, "percentage": 16.12, "elapsed_time": "6:47:31", "remaining_time": "1 day, 11:19:44", "throughput": 334.74, "total_tokens": 8184864} {"current_steps": 6455, "total_steps": 40000, "loss": 0.0882, "lr": 0.2811383422990657, "epoch": 0.3153934478293797, "percentage": 16.14, "elapsed_time": "6:47:34", "remaining_time": "1 day, 11:18:02", "throughput": 334.94, "total_tokens": 8190720} {"current_steps": 6460, "total_steps": 40000, "loss": 0.0902, "lr": 0.2811097358875152, "epoch": 0.31563774949307405, "percentage": 16.15, "elapsed_time": "6:47:37", "remaining_time": "1 day, 11:16:20", "throughput": 335.15, "total_tokens": 8196960} {"current_steps": 6465, "total_steps": 40000, "loss": 0.0903, "lr": 0.2810811092571959, "epoch": 0.3158820511567684, "percentage": 16.16, "elapsed_time": "6:47:40", "remaining_time": "1 day, 11:14:39", "throughput": 335.36, "total_tokens": 8203136} {"current_steps": 6470, "total_steps": 40000, "loss": 0.0781, "lr": 0.28105246241252224, "epoch": 0.3161263528204627, "percentage": 16.18, "elapsed_time": "6:47:43", "remaining_time": "1 day, 11:12:58", "throughput": 335.56, "total_tokens": 8208928} {"current_steps": 6475, "total_steps": 40000, "loss": 0.0911, "lr": 0.28102379535791194, "epoch": 0.316370654484157, "percentage": 16.19, "elapsed_time": "6:47:46", "remaining_time": "1 day, 11:11:17", "throughput": 335.77, "total_tokens": 8214976} {"current_steps": 6480, "total_steps": 40000, "loss": 0.0743, "lr": 0.2809951080977859, "epoch": 0.31661495614785135, "percentage": 16.2, "elapsed_time": "6:47:49", "remaining_time": "1 day, 11:09:36", "throughput": 335.99, "total_tokens": 8221472} {"current_steps": 6485, "total_steps": 40000, "loss": 0.0869, "lr": 0.28096640063656797, "epoch": 0.31685925781154567, "percentage": 16.21, "elapsed_time": "6:47:52", "remaining_time": "1 day, 11:07:56", "throughput": 336.2, "total_tokens": 8227680} {"current_steps": 6490, "total_steps": 40000, "loss": 0.0542, "lr": 0.2809376729786852, "epoch": 0.31710355947524005, "percentage": 16.23, "elapsed_time": "6:47:55", "remaining_time": "1 day, 11:06:16", "throughput": 336.42, "total_tokens": 8234176} {"current_steps": 6495, "total_steps": 40000, "loss": 0.0741, "lr": 0.28090892512856785, "epoch": 0.3173478611389344, "percentage": 16.24, "elapsed_time": "6:47:58", "remaining_time": "1 day, 11:04:35", "throughput": 336.63, "total_tokens": 8240288} {"current_steps": 6500, "total_steps": 40000, "loss": 0.0555, "lr": 0.2808801570906491, "epoch": 0.3175921628026287, "percentage": 16.25, "elapsed_time": "6:48:01", "remaining_time": "1 day, 11:02:55", "throughput": 336.85, "total_tokens": 8246752} {"current_steps": 6505, "total_steps": 40000, "loss": 0.0605, "lr": 0.2808513688693654, "epoch": 0.317836464466323, "percentage": 16.26, "elapsed_time": "6:48:04", "remaining_time": "1 day, 11:01:15", "throughput": 337.06, "total_tokens": 8252928} {"current_steps": 6510, "total_steps": 40000, "loss": 0.0474, "lr": 0.28082256046915627, "epoch": 0.31808076613001735, "percentage": 16.28, "elapsed_time": "6:48:07", "remaining_time": "1 day, 10:59:35", "throughput": 337.26, "total_tokens": 8258688} {"current_steps": 6515, "total_steps": 40000, "loss": 0.0761, "lr": 0.28079373189446427, "epoch": 0.31832506779371167, "percentage": 16.29, "elapsed_time": "6:48:10", "remaining_time": "1 day, 10:57:55", "throughput": 337.46, "total_tokens": 8264576} {"current_steps": 6520, "total_steps": 40000, "loss": 0.0863, "lr": 0.28076488314973513, "epoch": 0.318569369457406, "percentage": 16.3, "elapsed_time": "6:48:13", "remaining_time": "1 day, 10:56:15", "throughput": 337.66, "total_tokens": 8270656} {"current_steps": 6525, "total_steps": 40000, "loss": 0.0402, "lr": 0.28073601423941774, "epoch": 0.3188136711211003, "percentage": 16.31, "elapsed_time": "6:48:17", "remaining_time": "1 day, 10:54:36", "throughput": 337.88, "total_tokens": 8277152} {"current_steps": 6530, "total_steps": 40000, "loss": 0.1241, "lr": 0.28070712516796403, "epoch": 0.31905797278479464, "percentage": 16.32, "elapsed_time": "6:48:20", "remaining_time": "1 day, 10:52:56", "throughput": 338.08, "total_tokens": 8282944} {"current_steps": 6535, "total_steps": 40000, "loss": 0.0741, "lr": 0.28067821593982906, "epoch": 0.319302274448489, "percentage": 16.34, "elapsed_time": "6:48:23", "remaining_time": "1 day, 10:51:17", "throughput": 338.29, "total_tokens": 8289280} {"current_steps": 6540, "total_steps": 40000, "loss": 0.1065, "lr": 0.28064928655947097, "epoch": 0.31954657611218334, "percentage": 16.35, "elapsed_time": "6:48:26", "remaining_time": "1 day, 10:49:38", "throughput": 338.5, "total_tokens": 8295424} {"current_steps": 6545, "total_steps": 40000, "loss": 0.0558, "lr": 0.28062033703135103, "epoch": 0.31979087777587767, "percentage": 16.36, "elapsed_time": "6:48:29", "remaining_time": "1 day, 10:48:00", "throughput": 338.73, "total_tokens": 8302080} {"current_steps": 6550, "total_steps": 40000, "loss": 0.0459, "lr": 0.2805913673599337, "epoch": 0.320035179439572, "percentage": 16.38, "elapsed_time": "6:48:32", "remaining_time": "1 day, 10:46:22", "throughput": 338.98, "total_tokens": 8309344} {"current_steps": 6555, "total_steps": 40000, "loss": 0.0925, "lr": 0.2805623775496864, "epoch": 0.3202794811032663, "percentage": 16.39, "elapsed_time": "6:48:35", "remaining_time": "1 day, 10:44:44", "throughput": 339.21, "total_tokens": 8316032} {"current_steps": 6560, "total_steps": 40000, "loss": 0.0499, "lr": 0.2805333676050797, "epoch": 0.32052378276696064, "percentage": 16.4, "elapsed_time": "6:48:38", "remaining_time": "1 day, 10:43:06", "throughput": 339.44, "total_tokens": 8322688} {"current_steps": 6565, "total_steps": 40000, "loss": 0.0845, "lr": 0.2805043375305873, "epoch": 0.32076808443065497, "percentage": 16.41, "elapsed_time": "6:48:41", "remaining_time": "1 day, 10:41:28", "throughput": 339.65, "total_tokens": 8328768} {"current_steps": 6570, "total_steps": 40000, "loss": 0.0761, "lr": 0.2804752873306861, "epoch": 0.3210123860943493, "percentage": 16.43, "elapsed_time": "6:48:45", "remaining_time": "1 day, 10:39:50", "throughput": 339.85, "total_tokens": 8334944} {"current_steps": 6575, "total_steps": 40000, "loss": 0.085, "lr": 0.2804462170098559, "epoch": 0.3212566877580436, "percentage": 16.44, "elapsed_time": "6:48:48", "remaining_time": "1 day, 10:38:11", "throughput": 340.05, "total_tokens": 8340864} {"current_steps": 6580, "total_steps": 40000, "loss": 0.0687, "lr": 0.2804171265725797, "epoch": 0.32150098942173794, "percentage": 16.45, "elapsed_time": "6:48:51", "remaining_time": "1 day, 10:36:33", "throughput": 340.26, "total_tokens": 8347008} {"current_steps": 6585, "total_steps": 40000, "loss": 0.0556, "lr": 0.28038801602334373, "epoch": 0.3217452910854323, "percentage": 16.46, "elapsed_time": "6:48:54", "remaining_time": "1 day, 10:34:55", "throughput": 340.46, "total_tokens": 8352928} {"current_steps": 6590, "total_steps": 40000, "loss": 0.0784, "lr": 0.28035888536663717, "epoch": 0.32198959274912664, "percentage": 16.48, "elapsed_time": "6:48:57", "remaining_time": "1 day, 10:33:18", "throughput": 340.69, "total_tokens": 8359648} {"current_steps": 6595, "total_steps": 40000, "loss": 0.0597, "lr": 0.2803297346069522, "epoch": 0.32223389441282096, "percentage": 16.49, "elapsed_time": "6:49:00", "remaining_time": "1 day, 10:31:41", "throughput": 340.9, "total_tokens": 8365856} {"current_steps": 6600, "total_steps": 40000, "loss": 0.1151, "lr": 0.28030056374878437, "epoch": 0.3224781960765153, "percentage": 16.5, "elapsed_time": "6:49:03", "remaining_time": "1 day, 10:30:04", "throughput": 341.11, "total_tokens": 8372096} {"current_steps": 6600, "total_steps": 40000, "eval_loss": 0.0766669362783432, "epoch": 0.3224781960765153, "percentage": 16.5, "elapsed_time": "6:59:43", "remaining_time": "1 day, 11:24:03", "throughput": 332.44, "total_tokens": 8372096} {"current_steps": 6605, "total_steps": 40000, "loss": 0.0773, "lr": 0.2802713727966321, "epoch": 0.3227224977402096, "percentage": 16.51, "elapsed_time": "6:59:47", "remaining_time": "1 day, 11:22:27", "throughput": 332.64, "total_tokens": 8378336} {"current_steps": 6610, "total_steps": 40000, "loss": 0.0735, "lr": 0.28024216175499717, "epoch": 0.32296679940390394, "percentage": 16.53, "elapsed_time": "6:59:50", "remaining_time": "1 day, 11:20:48", "throughput": 332.86, "total_tokens": 8385056} {"current_steps": 6615, "total_steps": 40000, "loss": 0.0779, "lr": 0.2802129306283841, "epoch": 0.32321110106759826, "percentage": 16.54, "elapsed_time": "6:59:53", "remaining_time": "1 day, 11:19:09", "throughput": 333.09, "total_tokens": 8391776} {"current_steps": 6620, "total_steps": 40000, "loss": 0.0735, "lr": 0.28018367942130074, "epoch": 0.3234554027312926, "percentage": 16.55, "elapsed_time": "6:59:56", "remaining_time": "1 day, 11:17:30", "throughput": 333.31, "total_tokens": 8398368} {"current_steps": 6625, "total_steps": 40000, "loss": 0.0877, "lr": 0.28015440813825804, "epoch": 0.3236997043949869, "percentage": 16.56, "elapsed_time": "6:59:59", "remaining_time": "1 day, 11:15:50", "throughput": 333.52, "total_tokens": 8404768} {"current_steps": 6630, "total_steps": 40000, "loss": 0.0625, "lr": 0.28012511678377006, "epoch": 0.32394400605868123, "percentage": 16.57, "elapsed_time": "7:00:03", "remaining_time": "1 day, 11:14:11", "throughput": 333.73, "total_tokens": 8411072} {"current_steps": 6635, "total_steps": 40000, "loss": 0.0368, "lr": 0.28009580536235373, "epoch": 0.3241883077223756, "percentage": 16.59, "elapsed_time": "7:00:06", "remaining_time": "1 day, 11:12:33", "throughput": 333.98, "total_tokens": 8418304} {"current_steps": 6640, "total_steps": 40000, "loss": 0.0951, "lr": 0.28006647387852934, "epoch": 0.32443260938606994, "percentage": 16.6, "elapsed_time": "7:00:09", "remaining_time": "1 day, 11:10:54", "throughput": 334.19, "total_tokens": 8424704} {"current_steps": 6645, "total_steps": 40000, "loss": 0.1106, "lr": 0.28003712233682015, "epoch": 0.32467691104976426, "percentage": 16.61, "elapsed_time": "7:00:12", "remaining_time": "1 day, 11:09:15", "throughput": 334.4, "total_tokens": 8431008} {"current_steps": 6650, "total_steps": 40000, "loss": 0.0716, "lr": 0.2800077507417526, "epoch": 0.3249212127134586, "percentage": 16.62, "elapsed_time": "7:00:15", "remaining_time": "1 day, 11:07:37", "throughput": 334.62, "total_tokens": 8437632} {"current_steps": 6655, "total_steps": 40000, "loss": 0.0541, "lr": 0.2799783590978561, "epoch": 0.3251655143771529, "percentage": 16.64, "elapsed_time": "7:00:18", "remaining_time": "1 day, 11:05:58", "throughput": 334.81, "total_tokens": 8443456} {"current_steps": 6660, "total_steps": 40000, "loss": 0.0783, "lr": 0.2799489474096632, "epoch": 0.32540981604084723, "percentage": 16.65, "elapsed_time": "7:00:21", "remaining_time": "1 day, 11:04:20", "throughput": 335.03, "total_tokens": 8450112} {"current_steps": 6665, "total_steps": 40000, "loss": 0.0824, "lr": 0.27991951568170953, "epoch": 0.32565411770454156, "percentage": 16.66, "elapsed_time": "7:00:24", "remaining_time": "1 day, 11:02:41", "throughput": 335.24, "total_tokens": 8456256} {"current_steps": 6670, "total_steps": 40000, "loss": 0.0866, "lr": 0.2798900639185339, "epoch": 0.3258984193682359, "percentage": 16.68, "elapsed_time": "7:00:27", "remaining_time": "1 day, 11:01:04", "throughput": 335.46, "total_tokens": 8462976} {"current_steps": 6675, "total_steps": 40000, "loss": 0.069, "lr": 0.2798605921246781, "epoch": 0.3261427210319302, "percentage": 16.69, "elapsed_time": "7:00:31", "remaining_time": "1 day, 10:59:26", "throughput": 335.66, "total_tokens": 8469152} {"current_steps": 6680, "total_steps": 40000, "loss": 0.0561, "lr": 0.2798311003046871, "epoch": 0.3263870226956246, "percentage": 16.7, "elapsed_time": "7:00:34", "remaining_time": "1 day, 10:57:48", "throughput": 335.87, "total_tokens": 8475360} {"current_steps": 6685, "total_steps": 40000, "loss": 0.0534, "lr": 0.2798015884631089, "epoch": 0.3266313243593189, "percentage": 16.71, "elapsed_time": "7:00:37", "remaining_time": "1 day, 10:56:10", "throughput": 336.07, "total_tokens": 8481504} {"current_steps": 6690, "total_steps": 40000, "loss": 0.0696, "lr": 0.27977205660449445, "epoch": 0.32687562602301323, "percentage": 16.73, "elapsed_time": "7:00:40", "remaining_time": "1 day, 10:54:33", "throughput": 336.29, "total_tokens": 8488160} {"current_steps": 6695, "total_steps": 40000, "loss": 0.0272, "lr": 0.2797425047333981, "epoch": 0.32711992768670756, "percentage": 16.74, "elapsed_time": "7:00:43", "remaining_time": "1 day, 10:52:55", "throughput": 336.5, "total_tokens": 8494304} {"current_steps": 6700, "total_steps": 40000, "loss": 0.1103, "lr": 0.27971293285437715, "epoch": 0.3273642293504019, "percentage": 16.75, "elapsed_time": "7:00:46", "remaining_time": "1 day, 10:51:18", "throughput": 336.7, "total_tokens": 8500576} {"current_steps": 6705, "total_steps": 40000, "loss": 0.092, "lr": 0.2796833409719918, "epoch": 0.3276085310140962, "percentage": 16.76, "elapsed_time": "7:00:49", "remaining_time": "1 day, 10:49:41", "throughput": 336.91, "total_tokens": 8506880} {"current_steps": 6710, "total_steps": 40000, "loss": 0.0895, "lr": 0.27965372909080566, "epoch": 0.32785283267779053, "percentage": 16.78, "elapsed_time": "7:00:52", "remaining_time": "1 day, 10:48:04", "throughput": 337.11, "total_tokens": 8512928} {"current_steps": 6715, "total_steps": 40000, "loss": 0.0654, "lr": 0.27962409721538506, "epoch": 0.32809713434148485, "percentage": 16.79, "elapsed_time": "7:00:55", "remaining_time": "1 day, 10:46:28", "throughput": 337.34, "total_tokens": 8519808} {"current_steps": 6720, "total_steps": 40000, "loss": 0.0685, "lr": 0.27959444535029976, "epoch": 0.3283414360051792, "percentage": 16.8, "elapsed_time": "7:00:59", "remaining_time": "1 day, 10:44:52", "throughput": 337.58, "total_tokens": 8526848} {"current_steps": 6725, "total_steps": 40000, "loss": 0.0688, "lr": 0.27956477350012243, "epoch": 0.3285857376688735, "percentage": 16.81, "elapsed_time": "7:01:02", "remaining_time": "1 day, 10:43:16", "throughput": 337.8, "total_tokens": 8533536} {"current_steps": 6730, "total_steps": 40000, "loss": 0.0796, "lr": 0.27953508166942875, "epoch": 0.3288300393325679, "percentage": 16.83, "elapsed_time": "7:01:05", "remaining_time": "1 day, 10:41:39", "throughput": 338.0, "total_tokens": 8539776} {"current_steps": 6735, "total_steps": 40000, "loss": 0.0612, "lr": 0.27950536986279767, "epoch": 0.3290743409962622, "percentage": 16.84, "elapsed_time": "7:01:08", "remaining_time": "1 day, 10:40:03", "throughput": 338.22, "total_tokens": 8546176} {"current_steps": 6740, "total_steps": 40000, "loss": 0.0819, "lr": 0.2794756380848111, "epoch": 0.32931864265995653, "percentage": 16.85, "elapsed_time": "7:01:11", "remaining_time": "1 day, 10:38:27", "throughput": 338.42, "total_tokens": 8552384} {"current_steps": 6745, "total_steps": 40000, "loss": 0.0723, "lr": 0.279445886340054, "epoch": 0.32956294432365085, "percentage": 16.86, "elapsed_time": "7:01:14", "remaining_time": "1 day, 10:36:52", "throughput": 338.64, "total_tokens": 8559008} {"current_steps": 6750, "total_steps": 40000, "loss": 0.047, "lr": 0.27941611463311455, "epoch": 0.3298072459873452, "percentage": 16.88, "elapsed_time": "7:01:17", "remaining_time": "1 day, 10:35:15", "throughput": 338.83, "total_tokens": 8564800} {"current_steps": 6755, "total_steps": 40000, "loss": 0.0757, "lr": 0.2793863229685839, "epoch": 0.3300515476510395, "percentage": 16.89, "elapsed_time": "7:01:20", "remaining_time": "1 day, 10:33:39", "throughput": 339.03, "total_tokens": 8570784} {"current_steps": 6760, "total_steps": 40000, "loss": 0.0653, "lr": 0.27935651135105627, "epoch": 0.3302958493147338, "percentage": 16.9, "elapsed_time": "7:01:23", "remaining_time": "1 day, 10:32:04", "throughput": 339.25, "total_tokens": 8577472} {"current_steps": 6765, "total_steps": 40000, "loss": 0.101, "lr": 0.279326679785129, "epoch": 0.33054015097842815, "percentage": 16.91, "elapsed_time": "7:01:26", "remaining_time": "1 day, 10:30:29", "throughput": 339.46, "total_tokens": 8583872} {"current_steps": 6770, "total_steps": 40000, "loss": 0.0506, "lr": 0.2792968282754024, "epoch": 0.3307844526421225, "percentage": 16.93, "elapsed_time": "7:01:29", "remaining_time": "1 day, 10:28:53", "throughput": 339.66, "total_tokens": 8589920} {"current_steps": 6775, "total_steps": 40000, "loss": 0.0605, "lr": 0.2792669568264801, "epoch": 0.3310287543058168, "percentage": 16.94, "elapsed_time": "7:01:33", "remaining_time": "1 day, 10:27:18", "throughput": 339.87, "total_tokens": 8596256} {"current_steps": 6780, "total_steps": 40000, "loss": 0.1266, "lr": 0.27923706544296856, "epoch": 0.3312730559695112, "percentage": 16.95, "elapsed_time": "7:01:36", "remaining_time": "1 day, 10:25:43", "throughput": 340.07, "total_tokens": 8602496} {"current_steps": 6785, "total_steps": 40000, "loss": 0.0862, "lr": 0.2792071541294775, "epoch": 0.3315173576332055, "percentage": 16.96, "elapsed_time": "7:01:39", "remaining_time": "1 day, 10:24:08", "throughput": 340.28, "total_tokens": 8608928} {"current_steps": 6790, "total_steps": 40000, "loss": 0.0822, "lr": 0.27917722289061947, "epoch": 0.3317616592968998, "percentage": 16.98, "elapsed_time": "7:01:42", "remaining_time": "1 day, 10:22:33", "throughput": 340.5, "total_tokens": 8615328} {"current_steps": 6795, "total_steps": 40000, "loss": 0.0738, "lr": 0.27914727173101034, "epoch": 0.33200596096059415, "percentage": 16.99, "elapsed_time": "7:01:45", "remaining_time": "1 day, 10:20:59", "throughput": 340.71, "total_tokens": 8621792} {"current_steps": 6800, "total_steps": 40000, "loss": 0.049, "lr": 0.279117300655269, "epoch": 0.3322502626242885, "percentage": 17.0, "elapsed_time": "7:01:48", "remaining_time": "1 day, 10:19:24", "throughput": 340.92, "total_tokens": 8628064} {"current_steps": 6800, "total_steps": 40000, "eval_loss": 0.07683897018432617, "epoch": 0.3322502626242885, "percentage": 17.0, "elapsed_time": "7:12:27", "remaining_time": "1 day, 11:11:23", "throughput": 332.52, "total_tokens": 8628064} {"current_steps": 6805, "total_steps": 40000, "loss": 0.0629, "lr": 0.2790873096680173, "epoch": 0.3324945642879828, "percentage": 17.01, "elapsed_time": "7:12:31", "remaining_time": "1 day, 11:09:51", "throughput": 332.71, "total_tokens": 8634304} {"current_steps": 6810, "total_steps": 40000, "loss": 0.063, "lr": 0.2790572987738802, "epoch": 0.3327388659516771, "percentage": 17.03, "elapsed_time": "7:12:34", "remaining_time": "1 day, 11:08:14", "throughput": 332.92, "total_tokens": 8640800} {"current_steps": 6815, "total_steps": 40000, "loss": 0.0706, "lr": 0.27902726797748584, "epoch": 0.33298316761537144, "percentage": 17.04, "elapsed_time": "7:12:37", "remaining_time": "1 day, 11:06:37", "throughput": 333.12, "total_tokens": 8647008} {"current_steps": 6820, "total_steps": 40000, "loss": 0.0555, "lr": 0.2789972172834652, "epoch": 0.33322746927906577, "percentage": 17.05, "elapsed_time": "7:12:40", "remaining_time": "1 day, 11:05:01", "throughput": 333.32, "total_tokens": 8653280} {"current_steps": 6825, "total_steps": 40000, "loss": 0.05, "lr": 0.2789671466964527, "epoch": 0.3334717709427601, "percentage": 17.06, "elapsed_time": "7:12:43", "remaining_time": "1 day, 11:03:24", "throughput": 333.53, "total_tokens": 8659776} {"current_steps": 6830, "total_steps": 40000, "loss": 0.0477, "lr": 0.2789370562210854, "epoch": 0.3337160726064545, "percentage": 17.08, "elapsed_time": "7:12:46", "remaining_time": "1 day, 11:01:48", "throughput": 333.74, "total_tokens": 8666208} {"current_steps": 6835, "total_steps": 40000, "loss": 0.0875, "lr": 0.27890694586200376, "epoch": 0.3339603742701488, "percentage": 17.09, "elapsed_time": "7:12:49", "remaining_time": "1 day, 11:00:12", "throughput": 333.94, "total_tokens": 8672416} {"current_steps": 6840, "total_steps": 40000, "loss": 0.0854, "lr": 0.2788768156238511, "epoch": 0.3342046759338431, "percentage": 17.1, "elapsed_time": "7:12:52", "remaining_time": "1 day, 10:58:35", "throughput": 334.13, "total_tokens": 8678432} {"current_steps": 6845, "total_steps": 40000, "loss": 0.0691, "lr": 0.27884666551127385, "epoch": 0.33444897759753744, "percentage": 17.11, "elapsed_time": "7:12:56", "remaining_time": "1 day, 10:56:59", "throughput": 334.33, "total_tokens": 8684608} {"current_steps": 6850, "total_steps": 40000, "loss": 0.0681, "lr": 0.2788164955289217, "epoch": 0.33469327926123177, "percentage": 17.12, "elapsed_time": "7:12:59", "remaining_time": "1 day, 10:55:24", "throughput": 334.56, "total_tokens": 8691744} {"current_steps": 6855, "total_steps": 40000, "loss": 0.0547, "lr": 0.27878630568144697, "epoch": 0.3349375809249261, "percentage": 17.14, "elapsed_time": "7:13:02", "remaining_time": "1 day, 10:53:48", "throughput": 334.77, "total_tokens": 8698176} {"current_steps": 6860, "total_steps": 40000, "loss": 0.0847, "lr": 0.2787560959735056, "epoch": 0.3351818825886204, "percentage": 17.15, "elapsed_time": "7:13:05", "remaining_time": "1 day, 10:52:12", "throughput": 334.97, "total_tokens": 8704320} {"current_steps": 6865, "total_steps": 40000, "loss": 0.0744, "lr": 0.27872586640975616, "epoch": 0.33542618425231474, "percentage": 17.16, "elapsed_time": "7:13:08", "remaining_time": "1 day, 10:50:37", "throughput": 335.17, "total_tokens": 8710432} {"current_steps": 6870, "total_steps": 40000, "loss": 0.0758, "lr": 0.27869561699486045, "epoch": 0.33567048591600906, "percentage": 17.18, "elapsed_time": "7:13:11", "remaining_time": "1 day, 10:49:01", "throughput": 335.35, "total_tokens": 8716320} {"current_steps": 6875, "total_steps": 40000, "loss": 0.0817, "lr": 0.2786653477334833, "epoch": 0.33591478757970344, "percentage": 17.19, "elapsed_time": "7:13:14", "remaining_time": "1 day, 10:47:26", "throughput": 335.57, "total_tokens": 8723008} {"current_steps": 6880, "total_steps": 40000, "loss": 0.0424, "lr": 0.2786350586302926, "epoch": 0.33615908924339777, "percentage": 17.2, "elapsed_time": "7:13:17", "remaining_time": "1 day, 10:45:52", "throughput": 335.78, "total_tokens": 8729600} {"current_steps": 6885, "total_steps": 40000, "loss": 0.0697, "lr": 0.27860474968995935, "epoch": 0.3364033909070921, "percentage": 17.21, "elapsed_time": "7:13:20", "remaining_time": "1 day, 10:44:17", "throughput": 335.99, "total_tokens": 8736160} {"current_steps": 6890, "total_steps": 40000, "loss": 0.0753, "lr": 0.27857442091715756, "epoch": 0.3366476925707864, "percentage": 17.22, "elapsed_time": "7:13:24", "remaining_time": "1 day, 10:42:42", "throughput": 336.2, "total_tokens": 8742688} {"current_steps": 6895, "total_steps": 40000, "loss": 0.0649, "lr": 0.27854407231656425, "epoch": 0.33689199423448074, "percentage": 17.24, "elapsed_time": "7:13:27", "remaining_time": "1 day, 10:41:08", "throughput": 336.43, "total_tokens": 8749696} {"current_steps": 6900, "total_steps": 40000, "loss": 0.0962, "lr": 0.2785137038928596, "epoch": 0.33713629589817506, "percentage": 17.25, "elapsed_time": "7:13:30", "remaining_time": "1 day, 10:39:34", "throughput": 336.63, "total_tokens": 8755904} {"current_steps": 6905, "total_steps": 40000, "loss": 0.0675, "lr": 0.27848331565072687, "epoch": 0.3373805975618694, "percentage": 17.26, "elapsed_time": "7:13:33", "remaining_time": "1 day, 10:37:59", "throughput": 336.83, "total_tokens": 8762144} {"current_steps": 6910, "total_steps": 40000, "loss": 0.0664, "lr": 0.27845290759485225, "epoch": 0.3376248992255637, "percentage": 17.27, "elapsed_time": "7:13:36", "remaining_time": "1 day, 10:36:25", "throughput": 337.03, "total_tokens": 8768320} {"current_steps": 6915, "total_steps": 40000, "loss": 0.0671, "lr": 0.278422479729925, "epoch": 0.33786920088925804, "percentage": 17.29, "elapsed_time": "7:13:39", "remaining_time": "1 day, 10:34:51", "throughput": 337.24, "total_tokens": 8774848} {"current_steps": 6920, "total_steps": 40000, "loss": 0.0652, "lr": 0.2783920320606375, "epoch": 0.33811350255295236, "percentage": 17.3, "elapsed_time": "7:13:42", "remaining_time": "1 day, 10:33:17", "throughput": 337.43, "total_tokens": 8780928} {"current_steps": 6925, "total_steps": 40000, "loss": 0.0643, "lr": 0.2783615645916852, "epoch": 0.33835780421664674, "percentage": 17.31, "elapsed_time": "7:13:45", "remaining_time": "1 day, 10:31:43", "throughput": 337.63, "total_tokens": 8787200} {"current_steps": 6930, "total_steps": 40000, "loss": 0.0671, "lr": 0.2783310773277666, "epoch": 0.33860210588034106, "percentage": 17.32, "elapsed_time": "7:13:48", "remaining_time": "1 day, 10:30:10", "throughput": 337.84, "total_tokens": 8793568} {"current_steps": 6935, "total_steps": 40000, "loss": 0.0519, "lr": 0.2783005702735831, "epoch": 0.3388464075440354, "percentage": 17.34, "elapsed_time": "7:13:52", "remaining_time": "1 day, 10:28:36", "throughput": 338.04, "total_tokens": 8799968} {"current_steps": 6940, "total_steps": 40000, "loss": 0.0904, "lr": 0.2782700434338394, "epoch": 0.3390907092077297, "percentage": 17.35, "elapsed_time": "7:13:55", "remaining_time": "1 day, 10:27:03", "throughput": 338.27, "total_tokens": 8807008} {"current_steps": 6945, "total_steps": 40000, "loss": 0.0868, "lr": 0.278239496813243, "epoch": 0.33933501087142404, "percentage": 17.36, "elapsed_time": "7:13:58", "remaining_time": "1 day, 10:25:30", "throughput": 338.47, "total_tokens": 8813248} {"current_steps": 6950, "total_steps": 40000, "loss": 0.0858, "lr": 0.27820893041650463, "epoch": 0.33957931253511836, "percentage": 17.38, "elapsed_time": "7:14:01", "remaining_time": "1 day, 10:23:56", "throughput": 338.66, "total_tokens": 8819168} {"current_steps": 6955, "total_steps": 40000, "loss": 0.0628, "lr": 0.27817834424833804, "epoch": 0.3398236141988127, "percentage": 17.39, "elapsed_time": "7:14:04", "remaining_time": "1 day, 10:22:23", "throughput": 338.86, "total_tokens": 8825344} {"current_steps": 6960, "total_steps": 40000, "loss": 0.0873, "lr": 0.27814773831345996, "epoch": 0.340067915862507, "percentage": 17.4, "elapsed_time": "7:14:07", "remaining_time": "1 day, 10:20:49", "throughput": 339.05, "total_tokens": 8831392} {"current_steps": 6965, "total_steps": 40000, "loss": 0.0461, "lr": 0.2781171126165902, "epoch": 0.34031221752620133, "percentage": 17.41, "elapsed_time": "7:14:10", "remaining_time": "1 day, 10:19:17", "throughput": 339.25, "total_tokens": 8837568} {"current_steps": 6970, "total_steps": 40000, "loss": 0.0847, "lr": 0.2780864671624517, "epoch": 0.34055651918989566, "percentage": 17.42, "elapsed_time": "7:14:13", "remaining_time": "1 day, 10:17:44", "throughput": 339.46, "total_tokens": 8844224} {"current_steps": 6975, "total_steps": 40000, "loss": 0.063, "lr": 0.27805580195577034, "epoch": 0.34080082085359004, "percentage": 17.44, "elapsed_time": "7:14:16", "remaining_time": "1 day, 10:16:12", "throughput": 339.66, "total_tokens": 8850496} {"current_steps": 6980, "total_steps": 40000, "loss": 0.1096, "lr": 0.2780251170012751, "epoch": 0.34104512251728436, "percentage": 17.45, "elapsed_time": "7:14:19", "remaining_time": "1 day, 10:14:39", "throughput": 339.86, "total_tokens": 8856672} {"current_steps": 6985, "total_steps": 40000, "loss": 0.08, "lr": 0.27799441230369787, "epoch": 0.3412894241809787, "percentage": 17.46, "elapsed_time": "7:14:22", "remaining_time": "1 day, 10:13:07", "throughput": 340.08, "total_tokens": 8863456} {"current_steps": 6990, "total_steps": 40000, "loss": 0.1085, "lr": 0.27796368786777387, "epoch": 0.341533725844673, "percentage": 17.47, "elapsed_time": "7:14:25", "remaining_time": "1 day, 10:11:35", "throughput": 340.28, "total_tokens": 8869760} {"current_steps": 6995, "total_steps": 40000, "loss": 0.0704, "lr": 0.277932943698241, "epoch": 0.34177802750836733, "percentage": 17.49, "elapsed_time": "7:14:29", "remaining_time": "1 day, 10:10:03", "throughput": 340.5, "total_tokens": 8876384} {"current_steps": 7000, "total_steps": 40000, "loss": 0.0738, "lr": 0.2779021797998406, "epoch": 0.34202232917206166, "percentage": 17.5, "elapsed_time": "7:14:32", "remaining_time": "1 day, 10:08:31", "throughput": 340.69, "total_tokens": 8882496} {"current_steps": 7000, "total_steps": 40000, "eval_loss": 0.08142410218715668, "epoch": 0.34202232917206166, "percentage": 17.5, "elapsed_time": "7:25:12", "remaining_time": "1 day, 10:58:48", "throughput": 332.53, "total_tokens": 8882496} {"current_steps": 7005, "total_steps": 40000, "loss": 0.0865, "lr": 0.2778713961773167, "epoch": 0.342266630835756, "percentage": 17.51, "elapsed_time": "7:25:16", "remaining_time": "1 day, 10:57:18", "throughput": 332.7, "total_tokens": 8888576} {"current_steps": 7010, "total_steps": 40000, "loss": 0.0811, "lr": 0.2778405928354166, "epoch": 0.3425109324994503, "percentage": 17.52, "elapsed_time": "7:25:19", "remaining_time": "1 day, 10:55:44", "throughput": 332.91, "total_tokens": 8895072} {"current_steps": 7015, "total_steps": 40000, "loss": 0.0697, "lr": 0.27780976977889055, "epoch": 0.34275523416314463, "percentage": 17.54, "elapsed_time": "7:25:22", "remaining_time": "1 day, 10:54:09", "throughput": 333.1, "total_tokens": 8901152} {"current_steps": 7020, "total_steps": 40000, "loss": 0.0702, "lr": 0.27777892701249185, "epoch": 0.342999535826839, "percentage": 17.55, "elapsed_time": "7:25:25", "remaining_time": "1 day, 10:52:35", "throughput": 333.29, "total_tokens": 8907424} {"current_steps": 7025, "total_steps": 40000, "loss": 0.0804, "lr": 0.2777480645409768, "epoch": 0.34324383749053333, "percentage": 17.56, "elapsed_time": "7:25:28", "remaining_time": "1 day, 10:51:01", "throughput": 333.48, "total_tokens": 8913408} {"current_steps": 7030, "total_steps": 40000, "loss": 0.0741, "lr": 0.27771718236910486, "epoch": 0.34348813915422766, "percentage": 17.57, "elapsed_time": "7:25:31", "remaining_time": "1 day, 10:49:27", "throughput": 333.68, "total_tokens": 8919744} {"current_steps": 7035, "total_steps": 40000, "loss": 0.0692, "lr": 0.27768628050163835, "epoch": 0.343732440817922, "percentage": 17.59, "elapsed_time": "7:25:34", "remaining_time": "1 day, 10:47:54", "throughput": 333.87, "total_tokens": 8925952} {"current_steps": 7040, "total_steps": 40000, "loss": 0.0722, "lr": 0.2776553589433428, "epoch": 0.3439767424816163, "percentage": 17.6, "elapsed_time": "7:25:37", "remaining_time": "1 day, 10:46:21", "throughput": 334.08, "total_tokens": 8932608} {"current_steps": 7045, "total_steps": 40000, "loss": 0.0514, "lr": 0.27762441769898666, "epoch": 0.34422104414531063, "percentage": 17.61, "elapsed_time": "7:25:40", "remaining_time": "1 day, 10:44:48", "throughput": 334.3, "total_tokens": 8939520} {"current_steps": 7050, "total_steps": 40000, "loss": 0.0538, "lr": 0.2775934567733415, "epoch": 0.34446534580900495, "percentage": 17.62, "elapsed_time": "7:25:43", "remaining_time": "1 day, 10:43:14", "throughput": 334.48, "total_tokens": 8945344} {"current_steps": 7055, "total_steps": 40000, "loss": 0.0841, "lr": 0.2775624761711819, "epoch": 0.3447096474726993, "percentage": 17.64, "elapsed_time": "7:25:46", "remaining_time": "1 day, 10:41:41", "throughput": 334.69, "total_tokens": 8951872} {"current_steps": 7060, "total_steps": 40000, "loss": 0.0764, "lr": 0.2775314758972854, "epoch": 0.3449539491363936, "percentage": 17.65, "elapsed_time": "7:25:50", "remaining_time": "1 day, 10:40:08", "throughput": 334.9, "total_tokens": 8958720} {"current_steps": 7065, "total_steps": 40000, "loss": 0.0813, "lr": 0.2775004559564327, "epoch": 0.3451982508000879, "percentage": 17.66, "elapsed_time": "7:25:53", "remaining_time": "1 day, 10:38:35", "throughput": 335.1, "total_tokens": 8964960} {"current_steps": 7070, "total_steps": 40000, "loss": 0.0576, "lr": 0.2774694163534073, "epoch": 0.3454425524637823, "percentage": 17.68, "elapsed_time": "7:25:56", "remaining_time": "1 day, 10:37:02", "throughput": 335.29, "total_tokens": 8971200} {"current_steps": 7075, "total_steps": 40000, "loss": 0.0897, "lr": 0.27743835709299614, "epoch": 0.34568685412747663, "percentage": 17.69, "elapsed_time": "7:25:59", "remaining_time": "1 day, 10:35:30", "throughput": 335.51, "total_tokens": 8978112} {"current_steps": 7080, "total_steps": 40000, "loss": 0.0962, "lr": 0.2774072781799888, "epoch": 0.34593115579117095, "percentage": 17.7, "elapsed_time": "7:26:02", "remaining_time": "1 day, 10:33:57", "throughput": 335.69, "total_tokens": 8983936} {"current_steps": 7085, "total_steps": 40000, "loss": 0.0879, "lr": 0.27737617961917804, "epoch": 0.3461754574548653, "percentage": 17.71, "elapsed_time": "7:26:05", "remaining_time": "1 day, 10:32:25", "throughput": 335.89, "total_tokens": 8990240} {"current_steps": 7090, "total_steps": 40000, "loss": 0.078, "lr": 0.27734506141535964, "epoch": 0.3464197591185596, "percentage": 17.72, "elapsed_time": "7:26:08", "remaining_time": "1 day, 10:30:53", "throughput": 336.08, "total_tokens": 8996512} {"current_steps": 7095, "total_steps": 40000, "loss": 0.0588, "lr": 0.2773139235733325, "epoch": 0.3466640607822539, "percentage": 17.74, "elapsed_time": "7:26:11", "remaining_time": "1 day, 10:29:21", "throughput": 336.29, "total_tokens": 9002976} {"current_steps": 7100, "total_steps": 40000, "loss": 0.0755, "lr": 0.2772827660978984, "epoch": 0.34690836244594825, "percentage": 17.75, "elapsed_time": "7:26:14", "remaining_time": "1 day, 10:27:49", "throughput": 336.48, "total_tokens": 9009248} {"current_steps": 7105, "total_steps": 40000, "loss": 0.0948, "lr": 0.27725158899386226, "epoch": 0.3471526641096426, "percentage": 17.76, "elapsed_time": "7:26:17", "remaining_time": "1 day, 10:26:17", "throughput": 336.68, "total_tokens": 9015584} {"current_steps": 7110, "total_steps": 40000, "loss": 0.0726, "lr": 0.27722039226603196, "epoch": 0.3473969657733369, "percentage": 17.77, "elapsed_time": "7:26:20", "remaining_time": "1 day, 10:24:45", "throughput": 336.88, "total_tokens": 9021856} {"current_steps": 7115, "total_steps": 40000, "loss": 0.0478, "lr": 0.2771891759192184, "epoch": 0.3476412674370312, "percentage": 17.79, "elapsed_time": "7:26:23", "remaining_time": "1 day, 10:23:13", "throughput": 337.06, "total_tokens": 9027904} {"current_steps": 7120, "total_steps": 40000, "loss": 0.0834, "lr": 0.2771579399582355, "epoch": 0.3478855691007256, "percentage": 17.8, "elapsed_time": "7:26:27", "remaining_time": "1 day, 10:21:41", "throughput": 337.25, "total_tokens": 9033952} {"current_steps": 7125, "total_steps": 40000, "loss": 0.0782, "lr": 0.2771266843879004, "epoch": 0.3481298707644199, "percentage": 17.81, "elapsed_time": "7:26:30", "remaining_time": "1 day, 10:20:10", "throughput": 337.44, "total_tokens": 9040064} {"current_steps": 7130, "total_steps": 40000, "loss": 0.0739, "lr": 0.2770954092130329, "epoch": 0.34837417242811425, "percentage": 17.82, "elapsed_time": "7:26:33", "remaining_time": "1 day, 10:18:40", "throughput": 337.67, "total_tokens": 9047296} {"current_steps": 7135, "total_steps": 40000, "loss": 0.0575, "lr": 0.27706411443845613, "epoch": 0.3486184740918086, "percentage": 17.84, "elapsed_time": "7:26:36", "remaining_time": "1 day, 10:17:09", "throughput": 337.86, "total_tokens": 9053568} {"current_steps": 7140, "total_steps": 40000, "loss": 0.0612, "lr": 0.27703280006899617, "epoch": 0.3488627757555029, "percentage": 17.85, "elapsed_time": "7:26:39", "remaining_time": "1 day, 10:15:37", "throughput": 338.05, "total_tokens": 9059488} {"current_steps": 7145, "total_steps": 40000, "loss": 0.0567, "lr": 0.277001466109482, "epoch": 0.3491070774191972, "percentage": 17.86, "elapsed_time": "7:26:42", "remaining_time": "1 day, 10:14:07", "throughput": 338.25, "total_tokens": 9066080} {"current_steps": 7150, "total_steps": 40000, "loss": 0.0737, "lr": 0.2769701125647458, "epoch": 0.34935137908289154, "percentage": 17.88, "elapsed_time": "7:26:45", "remaining_time": "1 day, 10:12:35", "throughput": 338.44, "total_tokens": 9072000} {"current_steps": 7155, "total_steps": 40000, "loss": 0.1033, "lr": 0.27693873943962266, "epoch": 0.34959568074658587, "percentage": 17.89, "elapsed_time": "7:26:48", "remaining_time": "1 day, 10:11:05", "throughput": 338.63, "total_tokens": 9078304} {"current_steps": 7160, "total_steps": 40000, "loss": 0.0624, "lr": 0.2769073467389506, "epoch": 0.3498399824102802, "percentage": 17.9, "elapsed_time": "7:26:51", "remaining_time": "1 day, 10:09:34", "throughput": 338.83, "total_tokens": 9084672} {"current_steps": 7165, "total_steps": 40000, "loss": 0.0672, "lr": 0.2768759344675709, "epoch": 0.3500842840739745, "percentage": 17.91, "elapsed_time": "7:26:54", "remaining_time": "1 day, 10:08:04", "throughput": 339.01, "total_tokens": 9090624} {"current_steps": 7170, "total_steps": 40000, "loss": 0.0564, "lr": 0.27684450263032767, "epoch": 0.3503285857376689, "percentage": 17.93, "elapsed_time": "7:26:57", "remaining_time": "1 day, 10:06:33", "throughput": 339.21, "total_tokens": 9096768} {"current_steps": 7175, "total_steps": 40000, "loss": 0.0687, "lr": 0.2768130512320682, "epoch": 0.3505728874013632, "percentage": 17.94, "elapsed_time": "7:27:01", "remaining_time": "1 day, 10:05:03", "throughput": 339.41, "total_tokens": 9103424} {"current_steps": 7180, "total_steps": 40000, "loss": 0.0603, "lr": 0.27678158027764244, "epoch": 0.35081718906505754, "percentage": 17.95, "elapsed_time": "7:27:04", "remaining_time": "1 day, 10:03:33", "throughput": 339.61, "total_tokens": 9109792} {"current_steps": 7185, "total_steps": 40000, "loss": 0.0558, "lr": 0.27675008977190385, "epoch": 0.35106149072875187, "percentage": 17.96, "elapsed_time": "7:27:07", "remaining_time": "1 day, 10:02:04", "throughput": 339.81, "total_tokens": 9116128} {"current_steps": 7190, "total_steps": 40000, "loss": 0.0718, "lr": 0.2767185797197086, "epoch": 0.3513057923924462, "percentage": 17.97, "elapsed_time": "7:27:10", "remaining_time": "1 day, 10:00:34", "throughput": 340.0, "total_tokens": 9122304} {"current_steps": 7195, "total_steps": 40000, "loss": 0.0774, "lr": 0.2766870501259159, "epoch": 0.3515500940561405, "percentage": 17.99, "elapsed_time": "7:27:13", "remaining_time": "1 day, 9:59:04", "throughput": 340.21, "total_tokens": 9128896} {"current_steps": 7200, "total_steps": 40000, "loss": 0.0668, "lr": 0.276655500995388, "epoch": 0.35179439571983484, "percentage": 18.0, "elapsed_time": "7:27:16", "remaining_time": "1 day, 9:57:35", "throughput": 340.42, "total_tokens": 9135616} {"current_steps": 7200, "total_steps": 40000, "eval_loss": 0.07512001693248749, "epoch": 0.35179439571983484, "percentage": 18.0, "elapsed_time": "7:37:55", "remaining_time": "1 day, 10:46:05", "throughput": 332.5, "total_tokens": 9135616} {"current_steps": 7205, "total_steps": 40000, "loss": 0.0808, "lr": 0.27662393233299015, "epoch": 0.35203869738352916, "percentage": 18.01, "elapsed_time": "7:37:59", "remaining_time": "1 day, 10:44:36", "throughput": 332.68, "total_tokens": 9141888} {"current_steps": 7210, "total_steps": 40000, "loss": 0.0775, "lr": 0.27659234414359074, "epoch": 0.3522829990472235, "percentage": 18.02, "elapsed_time": "7:38:02", "remaining_time": "1 day, 10:43:04", "throughput": 332.87, "total_tokens": 9148000} {"current_steps": 7215, "total_steps": 40000, "loss": 0.0906, "lr": 0.27656073643206097, "epoch": 0.35252730071091787, "percentage": 18.04, "elapsed_time": "7:38:05", "remaining_time": "1 day, 10:41:32", "throughput": 333.06, "total_tokens": 9154304} {"current_steps": 7220, "total_steps": 40000, "loss": 0.0996, "lr": 0.27652910920327517, "epoch": 0.3527716023746122, "percentage": 18.05, "elapsed_time": "7:38:08", "remaining_time": "1 day, 10:40:00", "throughput": 333.23, "total_tokens": 9160000} {"current_steps": 7225, "total_steps": 40000, "loss": 0.0856, "lr": 0.2764974624621107, "epoch": 0.3530159040383065, "percentage": 18.06, "elapsed_time": "7:38:11", "remaining_time": "1 day, 10:38:30", "throughput": 333.46, "total_tokens": 9167360} {"current_steps": 7230, "total_steps": 40000, "loss": 0.061, "lr": 0.2764657962134479, "epoch": 0.35326020570200084, "percentage": 18.07, "elapsed_time": "7:38:14", "remaining_time": "1 day, 10:36:59", "throughput": 333.66, "total_tokens": 9173888} {"current_steps": 7235, "total_steps": 40000, "loss": 0.0902, "lr": 0.27643411046217, "epoch": 0.35350450736569516, "percentage": 18.09, "elapsed_time": "7:38:17", "remaining_time": "1 day, 10:35:27", "throughput": 333.84, "total_tokens": 9179648} {"current_steps": 7240, "total_steps": 40000, "loss": 0.0768, "lr": 0.27640240521316334, "epoch": 0.3537488090293895, "percentage": 18.1, "elapsed_time": "7:38:20", "remaining_time": "1 day, 10:33:55", "throughput": 334.01, "total_tokens": 9185568} {"current_steps": 7245, "total_steps": 40000, "loss": 0.0669, "lr": 0.2763706804713174, "epoch": 0.3539931106930838, "percentage": 18.11, "elapsed_time": "7:38:23", "remaining_time": "1 day, 10:32:25", "throughput": 334.21, "total_tokens": 9192032} {"current_steps": 7250, "total_steps": 40000, "loss": 0.0727, "lr": 0.2763389362415245, "epoch": 0.35423741235677814, "percentage": 18.12, "elapsed_time": "7:38:26", "remaining_time": "1 day, 10:30:54", "throughput": 334.4, "total_tokens": 9198304} {"current_steps": 7255, "total_steps": 40000, "loss": 0.0528, "lr": 0.27630717252867987, "epoch": 0.35448171402047246, "percentage": 18.14, "elapsed_time": "7:38:29", "remaining_time": "1 day, 10:29:24", "throughput": 334.62, "total_tokens": 9205344} {"current_steps": 7260, "total_steps": 40000, "loss": 0.0678, "lr": 0.276275389337682, "epoch": 0.3547260156841668, "percentage": 18.15, "elapsed_time": "7:38:32", "remaining_time": "1 day, 10:27:53", "throughput": 334.81, "total_tokens": 9211616} {"current_steps": 7265, "total_steps": 40000, "loss": 0.0562, "lr": 0.2762435866734322, "epoch": 0.35497031734786116, "percentage": 18.16, "elapsed_time": "7:38:35", "remaining_time": "1 day, 10:26:22", "throughput": 334.99, "total_tokens": 9217696} {"current_steps": 7270, "total_steps": 40000, "loss": 0.0688, "lr": 0.27621176454083485, "epoch": 0.3552146190115555, "percentage": 18.18, "elapsed_time": "7:38:39", "remaining_time": "1 day, 10:24:52", "throughput": 335.19, "total_tokens": 9224128} {"current_steps": 7275, "total_steps": 40000, "loss": 0.0881, "lr": 0.2761799229447973, "epoch": 0.3554589206752498, "percentage": 18.19, "elapsed_time": "7:38:42", "remaining_time": "1 day, 10:23:22", "throughput": 335.39, "total_tokens": 9230528} {"current_steps": 7280, "total_steps": 40000, "loss": 0.0529, "lr": 0.27614806189023006, "epoch": 0.35570322233894414, "percentage": 18.2, "elapsed_time": "7:38:45", "remaining_time": "1 day, 10:21:52", "throughput": 335.59, "total_tokens": 9237216} {"current_steps": 7285, "total_steps": 40000, "loss": 0.0772, "lr": 0.27611618138204636, "epoch": 0.35594752400263846, "percentage": 18.21, "elapsed_time": "7:38:48", "remaining_time": "1 day, 10:20:22", "throughput": 335.77, "total_tokens": 9243104} {"current_steps": 7290, "total_steps": 40000, "loss": 0.0797, "lr": 0.2760842814251626, "epoch": 0.3561918256663328, "percentage": 18.22, "elapsed_time": "7:38:51", "remaining_time": "1 day, 10:18:52", "throughput": 335.96, "total_tokens": 9249536} {"current_steps": 7295, "total_steps": 40000, "loss": 0.1021, "lr": 0.2760523620244982, "epoch": 0.3564361273300271, "percentage": 18.24, "elapsed_time": "7:38:54", "remaining_time": "1 day, 10:17:22", "throughput": 336.16, "total_tokens": 9256096} {"current_steps": 7300, "total_steps": 40000, "loss": 0.0756, "lr": 0.27602042318497544, "epoch": 0.35668042899372143, "percentage": 18.25, "elapsed_time": "7:38:57", "remaining_time": "1 day, 10:15:53", "throughput": 336.37, "total_tokens": 9262784} {"current_steps": 7305, "total_steps": 40000, "loss": 0.0609, "lr": 0.2759884649115198, "epoch": 0.35692473065741576, "percentage": 18.26, "elapsed_time": "7:39:00", "remaining_time": "1 day, 10:14:23", "throughput": 336.56, "total_tokens": 9268960} {"current_steps": 7310, "total_steps": 40000, "loss": 0.0711, "lr": 0.2759564872090596, "epoch": 0.3571690323211101, "percentage": 18.27, "elapsed_time": "7:39:03", "remaining_time": "1 day, 10:12:55", "throughput": 336.76, "total_tokens": 9275680} {"current_steps": 7315, "total_steps": 40000, "loss": 0.07, "lr": 0.2759244900825262, "epoch": 0.35741333398480446, "percentage": 18.29, "elapsed_time": "7:39:06", "remaining_time": "1 day, 10:11:25", "throughput": 336.95, "total_tokens": 9281824} {"current_steps": 7320, "total_steps": 40000, "loss": 0.0473, "lr": 0.2758924735368539, "epoch": 0.3576576356484988, "percentage": 18.3, "elapsed_time": "7:39:10", "remaining_time": "1 day, 10:09:56", "throughput": 337.15, "total_tokens": 9288416} {"current_steps": 7325, "total_steps": 40000, "loss": 0.0831, "lr": 0.27586043757698014, "epoch": 0.3579019373121931, "percentage": 18.31, "elapsed_time": "7:39:13", "remaining_time": "1 day, 10:08:27", "throughput": 337.33, "total_tokens": 9294528} {"current_steps": 7330, "total_steps": 40000, "loss": 0.0537, "lr": 0.27582838220784534, "epoch": 0.35814623897588743, "percentage": 18.32, "elapsed_time": "7:39:16", "remaining_time": "1 day, 10:06:58", "throughput": 337.53, "total_tokens": 9300928} {"current_steps": 7335, "total_steps": 40000, "loss": 0.0622, "lr": 0.27579630743439265, "epoch": 0.35839054063958176, "percentage": 18.34, "elapsed_time": "7:39:19", "remaining_time": "1 day, 10:05:29", "throughput": 337.73, "total_tokens": 9307488} {"current_steps": 7340, "total_steps": 40000, "loss": 0.08, "lr": 0.2757642132615686, "epoch": 0.3586348423032761, "percentage": 18.35, "elapsed_time": "7:39:22", "remaining_time": "1 day, 10:04:00", "throughput": 337.9, "total_tokens": 9313184} {"current_steps": 7345, "total_steps": 40000, "loss": 0.0723, "lr": 0.2757320996943223, "epoch": 0.3588791439669704, "percentage": 18.36, "elapsed_time": "7:39:25", "remaining_time": "1 day, 10:02:31", "throughput": 338.09, "total_tokens": 9319488} {"current_steps": 7350, "total_steps": 40000, "loss": 0.0671, "lr": 0.2756999667376062, "epoch": 0.35912344563066473, "percentage": 18.38, "elapsed_time": "7:39:28", "remaining_time": "1 day, 10:01:03", "throughput": 338.28, "total_tokens": 9325696} {"current_steps": 7355, "total_steps": 40000, "loss": 0.1038, "lr": 0.2756678143963756, "epoch": 0.35936774729435905, "percentage": 18.39, "elapsed_time": "7:39:31", "remaining_time": "1 day, 9:59:34", "throughput": 338.46, "total_tokens": 9331904} {"current_steps": 7360, "total_steps": 40000, "loss": 0.0465, "lr": 0.2756356426755888, "epoch": 0.35961204895805343, "percentage": 18.4, "elapsed_time": "7:39:34", "remaining_time": "1 day, 9:58:06", "throughput": 338.65, "total_tokens": 9338112} {"current_steps": 7365, "total_steps": 40000, "loss": 0.0553, "lr": 0.27560345158020705, "epoch": 0.35985635062174776, "percentage": 18.41, "elapsed_time": "7:39:37", "remaining_time": "1 day, 9:56:38", "throughput": 338.85, "total_tokens": 9344672} {"current_steps": 7370, "total_steps": 40000, "loss": 0.0708, "lr": 0.27557124111519465, "epoch": 0.3601006522854421, "percentage": 18.43, "elapsed_time": "7:39:40", "remaining_time": "1 day, 9:55:10", "throughput": 339.04, "total_tokens": 9350944} {"current_steps": 7375, "total_steps": 40000, "loss": 0.0545, "lr": 0.27553901128551883, "epoch": 0.3603449539491364, "percentage": 18.44, "elapsed_time": "7:39:43", "remaining_time": "1 day, 9:53:43", "throughput": 339.23, "total_tokens": 9357312} {"current_steps": 7380, "total_steps": 40000, "loss": 0.0549, "lr": 0.2755067620961498, "epoch": 0.36058925561283073, "percentage": 18.45, "elapsed_time": "7:39:46", "remaining_time": "1 day, 9:52:16", "throughput": 339.44, "total_tokens": 9364096} {"current_steps": 7385, "total_steps": 40000, "loss": 0.0474, "lr": 0.27547449355206094, "epoch": 0.36083355727652505, "percentage": 18.46, "elapsed_time": "7:39:50", "remaining_time": "1 day, 9:50:48", "throughput": 339.63, "total_tokens": 9370336} {"current_steps": 7390, "total_steps": 40000, "loss": 0.0786, "lr": 0.2754422056582283, "epoch": 0.3610778589402194, "percentage": 18.48, "elapsed_time": "7:39:53", "remaining_time": "1 day, 9:49:20", "throughput": 339.82, "total_tokens": 9376768} {"current_steps": 7395, "total_steps": 40000, "loss": 0.0919, "lr": 0.27540989841963115, "epoch": 0.3613221606039137, "percentage": 18.49, "elapsed_time": "7:39:56", "remaining_time": "1 day, 9:47:52", "throughput": 340.01, "total_tokens": 9382880} {"current_steps": 7400, "total_steps": 40000, "loss": 0.0849, "lr": 0.27537757184125167, "epoch": 0.361566462267608, "percentage": 18.5, "elapsed_time": "7:39:59", "remaining_time": "1 day, 9:46:25", "throughput": 340.2, "total_tokens": 9389184} {"current_steps": 7400, "total_steps": 40000, "eval_loss": 0.08088066428899765, "epoch": 0.361566462267608, "percentage": 18.5, "elapsed_time": "7:50:38", "remaining_time": "1 day, 10:33:20", "throughput": 332.5, "total_tokens": 9389184} {"current_steps": 7405, "total_steps": 40000, "loss": 0.1033, "lr": 0.275345225928075, "epoch": 0.36181076393130235, "percentage": 18.51, "elapsed_time": "7:50:42", "remaining_time": "1 day, 10:31:54", "throughput": 332.67, "total_tokens": 9395264} {"current_steps": 7410, "total_steps": 40000, "loss": 0.1006, "lr": 0.2753128606850893, "epoch": 0.36205506559499673, "percentage": 18.52, "elapsed_time": "7:50:45", "remaining_time": "1 day, 10:30:25", "throughput": 332.86, "total_tokens": 9401664} {"current_steps": 7415, "total_steps": 40000, "loss": 0.0914, "lr": 0.2752804761172858, "epoch": 0.36229936725869105, "percentage": 18.54, "elapsed_time": "7:50:48", "remaining_time": "1 day, 10:28:56", "throughput": 333.05, "total_tokens": 9408032} {"current_steps": 7420, "total_steps": 40000, "loss": 0.0736, "lr": 0.27524807222965836, "epoch": 0.3625436689223854, "percentage": 18.55, "elapsed_time": "7:50:51", "remaining_time": "1 day, 10:27:26", "throughput": 333.23, "total_tokens": 9414240} {"current_steps": 7425, "total_steps": 40000, "loss": 0.0912, "lr": 0.27521564902720436, "epoch": 0.3627879705860797, "percentage": 18.56, "elapsed_time": "7:50:54", "remaining_time": "1 day, 10:25:57", "throughput": 333.4, "total_tokens": 9420032} {"current_steps": 7430, "total_steps": 40000, "loss": 0.066, "lr": 0.2751832065149236, "epoch": 0.363032272249774, "percentage": 18.57, "elapsed_time": "7:50:57", "remaining_time": "1 day, 10:24:28", "throughput": 333.58, "total_tokens": 9426240} {"current_steps": 7435, "total_steps": 40000, "loss": 0.065, "lr": 0.2751507446978193, "epoch": 0.36327657391346835, "percentage": 18.59, "elapsed_time": "7:51:00", "remaining_time": "1 day, 10:23:00", "throughput": 333.78, "total_tokens": 9432928} {"current_steps": 7440, "total_steps": 40000, "loss": 0.0692, "lr": 0.2751182635808974, "epoch": 0.36352087557716267, "percentage": 18.6, "elapsed_time": "7:51:03", "remaining_time": "1 day, 10:21:31", "throughput": 333.98, "total_tokens": 9439648} {"current_steps": 7445, "total_steps": 40000, "loss": 0.0718, "lr": 0.27508576316916694, "epoch": 0.363765177240857, "percentage": 18.61, "elapsed_time": "7:51:06", "remaining_time": "1 day, 10:20:03", "throughput": 334.17, "total_tokens": 9445888} {"current_steps": 7450, "total_steps": 40000, "loss": 0.0731, "lr": 0.2750532434676399, "epoch": 0.3640094789045513, "percentage": 18.62, "elapsed_time": "7:51:09", "remaining_time": "1 day, 10:18:34", "throughput": 334.36, "total_tokens": 9452192} {"current_steps": 7455, "total_steps": 40000, "loss": 0.0811, "lr": 0.27502070448133115, "epoch": 0.36425378056824564, "percentage": 18.64, "elapsed_time": "7:51:12", "remaining_time": "1 day, 10:17:06", "throughput": 334.55, "total_tokens": 9458592} {"current_steps": 7460, "total_steps": 40000, "loss": 0.0873, "lr": 0.2749881462152587, "epoch": 0.36449808223194, "percentage": 18.65, "elapsed_time": "7:51:16", "remaining_time": "1 day, 10:15:38", "throughput": 334.74, "total_tokens": 9465216} {"current_steps": 7465, "total_steps": 40000, "loss": 0.0681, "lr": 0.2749555686744434, "epoch": 0.36474238389563435, "percentage": 18.66, "elapsed_time": "7:51:19", "remaining_time": "1 day, 10:14:10", "throughput": 334.93, "total_tokens": 9471552} {"current_steps": 7470, "total_steps": 40000, "loss": 0.0632, "lr": 0.2749229718639091, "epoch": 0.36498668555932867, "percentage": 18.68, "elapsed_time": "7:51:22", "remaining_time": "1 day, 10:12:42", "throughput": 335.11, "total_tokens": 9477728} {"current_steps": 7475, "total_steps": 40000, "loss": 0.0666, "lr": 0.27489035578868265, "epoch": 0.365230987223023, "percentage": 18.69, "elapsed_time": "7:51:25", "remaining_time": "1 day, 10:11:13", "throughput": 335.29, "total_tokens": 9483776} {"current_steps": 7480, "total_steps": 40000, "loss": 0.0633, "lr": 0.2748577204537939, "epoch": 0.3654752888867173, "percentage": 18.7, "elapsed_time": "7:51:28", "remaining_time": "1 day, 10:09:46", "throughput": 335.5, "total_tokens": 9490816} {"current_steps": 7485, "total_steps": 40000, "loss": 0.0929, "lr": 0.2748250658642756, "epoch": 0.36571959055041164, "percentage": 18.71, "elapsed_time": "7:51:31", "remaining_time": "1 day, 10:08:19", "throughput": 335.69, "total_tokens": 9497152} {"current_steps": 7490, "total_steps": 40000, "loss": 0.0543, "lr": 0.2747923920251634, "epoch": 0.36596389221410597, "percentage": 18.73, "elapsed_time": "7:51:34", "remaining_time": "1 day, 10:06:51", "throughput": 335.87, "total_tokens": 9503392} {"current_steps": 7495, "total_steps": 40000, "loss": 0.0834, "lr": 0.27475969894149627, "epoch": 0.3662081938778003, "percentage": 18.74, "elapsed_time": "7:51:37", "remaining_time": "1 day, 10:05:24", "throughput": 336.06, "total_tokens": 9509632} {"current_steps": 7500, "total_steps": 40000, "loss": 0.0896, "lr": 0.2747269866183156, "epoch": 0.3664524955414946, "percentage": 18.75, "elapsed_time": "7:51:40", "remaining_time": "1 day, 10:03:56", "throughput": 336.24, "total_tokens": 9515808} {"current_steps": 7505, "total_steps": 40000, "loss": 0.0939, "lr": 0.27469425506066625, "epoch": 0.36669679720518894, "percentage": 18.76, "elapsed_time": "7:51:43", "remaining_time": "1 day, 10:02:29", "throughput": 336.43, "total_tokens": 9522112} {"current_steps": 7510, "total_steps": 40000, "loss": 0.0698, "lr": 0.27466150427359576, "epoch": 0.3669410988688833, "percentage": 18.77, "elapsed_time": "7:51:46", "remaining_time": "1 day, 10:01:02", "throughput": 336.62, "total_tokens": 9528608} {"current_steps": 7515, "total_steps": 40000, "loss": 0.0801, "lr": 0.2746287342621547, "epoch": 0.36718540053257764, "percentage": 18.79, "elapsed_time": "7:51:49", "remaining_time": "1 day, 9:59:35", "throughput": 336.81, "total_tokens": 9534944} {"current_steps": 7520, "total_steps": 40000, "loss": 0.0728, "lr": 0.2745959450313966, "epoch": 0.36742970219627197, "percentage": 18.8, "elapsed_time": "7:51:52", "remaining_time": "1 day, 9:58:08", "throughput": 336.99, "total_tokens": 9541088} {"current_steps": 7525, "total_steps": 40000, "loss": 0.0868, "lr": 0.27456313658637804, "epoch": 0.3676740038599663, "percentage": 18.81, "elapsed_time": "7:51:56", "remaining_time": "1 day, 9:56:40", "throughput": 337.17, "total_tokens": 9547168} {"current_steps": 7530, "total_steps": 40000, "loss": 0.0947, "lr": 0.27453030893215846, "epoch": 0.3679183055236606, "percentage": 18.82, "elapsed_time": "7:51:59", "remaining_time": "1 day, 9:55:14", "throughput": 337.35, "total_tokens": 9553312} {"current_steps": 7535, "total_steps": 40000, "loss": 0.0796, "lr": 0.2744974620738003, "epoch": 0.36816260718735494, "percentage": 18.84, "elapsed_time": "7:52:02", "remaining_time": "1 day, 9:53:47", "throughput": 337.53, "total_tokens": 9559712} {"current_steps": 7540, "total_steps": 40000, "loss": 0.059, "lr": 0.27446459601636897, "epoch": 0.36840690885104926, "percentage": 18.85, "elapsed_time": "7:52:05", "remaining_time": "1 day, 9:52:21", "throughput": 337.72, "total_tokens": 9566080} {"current_steps": 7545, "total_steps": 40000, "loss": 0.0637, "lr": 0.2744317107649328, "epoch": 0.3686512105147436, "percentage": 18.86, "elapsed_time": "7:52:08", "remaining_time": "1 day, 9:50:55", "throughput": 337.9, "total_tokens": 9572160} {"current_steps": 7550, "total_steps": 40000, "loss": 0.0748, "lr": 0.2743988063245631, "epoch": 0.3688955121784379, "percentage": 18.88, "elapsed_time": "7:52:11", "remaining_time": "1 day, 9:49:28", "throughput": 338.08, "total_tokens": 9578336} {"current_steps": 7555, "total_steps": 40000, "loss": 0.0741, "lr": 0.2743658827003342, "epoch": 0.3691398138421323, "percentage": 18.89, "elapsed_time": "7:52:14", "remaining_time": "1 day, 9:48:03", "throughput": 338.28, "total_tokens": 9584960} {"current_steps": 7560, "total_steps": 40000, "loss": 0.075, "lr": 0.27433293989732327, "epoch": 0.3693841155058266, "percentage": 18.9, "elapsed_time": "7:52:17", "remaining_time": "1 day, 9:46:37", "throughput": 338.47, "total_tokens": 9591392} {"current_steps": 7565, "total_steps": 40000, "loss": 0.0607, "lr": 0.27429997792061056, "epoch": 0.36962841716952094, "percentage": 18.91, "elapsed_time": "7:52:20", "remaining_time": "1 day, 9:45:10", "throughput": 338.64, "total_tokens": 9597248} {"current_steps": 7570, "total_steps": 40000, "loss": 0.0742, "lr": 0.27426699677527927, "epoch": 0.36987271883321526, "percentage": 18.93, "elapsed_time": "7:52:23", "remaining_time": "1 day, 9:43:45", "throughput": 338.84, "total_tokens": 9603904} {"current_steps": 7575, "total_steps": 40000, "loss": 0.0694, "lr": 0.2742339964664154, "epoch": 0.3701170204969096, "percentage": 18.94, "elapsed_time": "7:52:26", "remaining_time": "1 day, 9:42:19", "throughput": 339.01, "total_tokens": 9609984} {"current_steps": 7580, "total_steps": 40000, "loss": 0.1, "lr": 0.274200976999108, "epoch": 0.3703613221606039, "percentage": 18.95, "elapsed_time": "7:52:29", "remaining_time": "1 day, 9:40:54", "throughput": 339.2, "total_tokens": 9616416} {"current_steps": 7585, "total_steps": 40000, "loss": 0.0965, "lr": 0.27416793837844916, "epoch": 0.37060562382429824, "percentage": 18.96, "elapsed_time": "7:52:33", "remaining_time": "1 day, 9:39:28", "throughput": 339.4, "total_tokens": 9622912} {"current_steps": 7590, "total_steps": 40000, "loss": 0.0977, "lr": 0.27413488060953384, "epoch": 0.37084992548799256, "percentage": 18.98, "elapsed_time": "7:52:36", "remaining_time": "1 day, 9:38:03", "throughput": 339.57, "total_tokens": 9628960} {"current_steps": 7595, "total_steps": 40000, "loss": 0.0875, "lr": 0.27410180369745996, "epoch": 0.3710942271516869, "percentage": 18.99, "elapsed_time": "7:52:39", "remaining_time": "1 day, 9:36:38", "throughput": 339.75, "total_tokens": 9635008} {"current_steps": 7600, "total_steps": 40000, "loss": 0.0857, "lr": 0.27406870764732844, "epoch": 0.3713385288153812, "percentage": 19.0, "elapsed_time": "7:52:42", "remaining_time": "1 day, 9:35:12", "throughput": 339.94, "total_tokens": 9641344} {"current_steps": 7600, "total_steps": 40000, "eval_loss": 0.08132880926132202, "epoch": 0.3713385288153812, "percentage": 19.0, "elapsed_time": "8:03:21", "remaining_time": "1 day, 10:20:38", "throughput": 332.44, "total_tokens": 9641344} {"current_steps": 7605, "total_steps": 40000, "loss": 0.0938, "lr": 0.27403559246424297, "epoch": 0.3715828304790756, "percentage": 19.01, "elapsed_time": "8:03:25", "remaining_time": "1 day, 10:19:14", "throughput": 332.61, "total_tokens": 9647424} {"current_steps": 7610, "total_steps": 40000, "loss": 0.1008, "lr": 0.2740024581533105, "epoch": 0.3718271321427699, "percentage": 19.02, "elapsed_time": "8:03:28", "remaining_time": "1 day, 10:17:46", "throughput": 332.79, "total_tokens": 9653824} {"current_steps": 7615, "total_steps": 40000, "loss": 0.1035, "lr": 0.2739693047196406, "epoch": 0.37207143380646424, "percentage": 19.04, "elapsed_time": "8:03:31", "remaining_time": "1 day, 10:16:19", "throughput": 332.98, "total_tokens": 9660160} {"current_steps": 7620, "total_steps": 40000, "loss": 0.0866, "lr": 0.27393613216834606, "epoch": 0.37231573547015856, "percentage": 19.05, "elapsed_time": "8:03:34", "remaining_time": "1 day, 10:14:53", "throughput": 333.16, "total_tokens": 9666464} {"current_steps": 7625, "total_steps": 40000, "loss": 0.1017, "lr": 0.2739029405045424, "epoch": 0.3725600371338529, "percentage": 19.06, "elapsed_time": "8:03:37", "remaining_time": "1 day, 10:13:26", "throughput": 333.35, "total_tokens": 9672928} {"current_steps": 7630, "total_steps": 40000, "loss": 0.0779, "lr": 0.2738697297333483, "epoch": 0.3728043387975472, "percentage": 19.07, "elapsed_time": "8:03:40", "remaining_time": "1 day, 10:11:59", "throughput": 333.53, "total_tokens": 9679456} {"current_steps": 7635, "total_steps": 40000, "loss": 0.0713, "lr": 0.2738364998598852, "epoch": 0.37304864046124153, "percentage": 19.09, "elapsed_time": "8:03:44", "remaining_time": "1 day, 10:10:33", "throughput": 333.73, "total_tokens": 9686208} {"current_steps": 7640, "total_steps": 40000, "loss": 0.0708, "lr": 0.27380325088927765, "epoch": 0.37329294212493586, "percentage": 19.1, "elapsed_time": "8:03:47", "remaining_time": "1 day, 10:09:07", "throughput": 333.91, "total_tokens": 9692544} {"current_steps": 7645, "total_steps": 40000, "loss": 0.0602, "lr": 0.27376998282665294, "epoch": 0.3735372437886302, "percentage": 19.11, "elapsed_time": "8:03:50", "remaining_time": "1 day, 10:07:41", "throughput": 334.09, "total_tokens": 9698752} {"current_steps": 7650, "total_steps": 40000, "loss": 0.0574, "lr": 0.27373669567714154, "epoch": 0.3737815454523245, "percentage": 19.12, "elapsed_time": "8:03:53", "remaining_time": "1 day, 10:06:15", "throughput": 334.27, "total_tokens": 9705120} {"current_steps": 7655, "total_steps": 40000, "loss": 0.0772, "lr": 0.27370338944587663, "epoch": 0.3740258471160189, "percentage": 19.14, "elapsed_time": "8:03:56", "remaining_time": "1 day, 10:04:48", "throughput": 334.46, "total_tokens": 9711488} {"current_steps": 7660, "total_steps": 40000, "loss": 0.086, "lr": 0.27367006413799455, "epoch": 0.3742701487797132, "percentage": 19.15, "elapsed_time": "8:03:59", "remaining_time": "1 day, 10:03:23", "throughput": 334.66, "total_tokens": 9718368} {"current_steps": 7665, "total_steps": 40000, "loss": 0.0473, "lr": 0.2736367197586345, "epoch": 0.37451445044340753, "percentage": 19.16, "elapsed_time": "8:04:02", "remaining_time": "1 day, 10:01:57", "throughput": 334.83, "total_tokens": 9724384} {"current_steps": 7670, "total_steps": 40000, "loss": 0.0711, "lr": 0.2736033563129385, "epoch": 0.37475875210710186, "percentage": 19.18, "elapsed_time": "8:04:05", "remaining_time": "1 day, 10:00:31", "throughput": 335.0, "total_tokens": 9730400} {"current_steps": 7675, "total_steps": 40000, "loss": 0.0451, "lr": 0.27356997380605164, "epoch": 0.3750030537707962, "percentage": 19.19, "elapsed_time": "8:04:08", "remaining_time": "1 day, 9:59:05", "throughput": 335.19, "total_tokens": 9737024} {"current_steps": 7680, "total_steps": 40000, "loss": 0.0656, "lr": 0.27353657224312194, "epoch": 0.3752473554344905, "percentage": 19.2, "elapsed_time": "8:04:11", "remaining_time": "1 day, 9:57:40", "throughput": 335.37, "total_tokens": 9743008} {"current_steps": 7685, "total_steps": 40000, "loss": 0.0843, "lr": 0.2735031516293004, "epoch": 0.37549165709818483, "percentage": 19.21, "elapsed_time": "8:04:14", "remaining_time": "1 day, 9:56:14", "throughput": 335.54, "total_tokens": 9749152} {"current_steps": 7690, "total_steps": 40000, "loss": 0.076, "lr": 0.2734697119697408, "epoch": 0.37573595876187915, "percentage": 19.23, "elapsed_time": "8:04:18", "remaining_time": "1 day, 9:54:49", "throughput": 335.72, "total_tokens": 9755424} {"current_steps": 7695, "total_steps": 40000, "loss": 0.0497, "lr": 0.27343625326959997, "epoch": 0.3759802604255735, "percentage": 19.24, "elapsed_time": "8:04:21", "remaining_time": "1 day, 9:53:23", "throughput": 335.9, "total_tokens": 9761760} {"current_steps": 7700, "total_steps": 40000, "loss": 0.0639, "lr": 0.27340277553403775, "epoch": 0.37622456208926786, "percentage": 19.25, "elapsed_time": "8:04:24", "remaining_time": "1 day, 9:51:58", "throughput": 336.09, "total_tokens": 9768064} {"current_steps": 7705, "total_steps": 40000, "loss": 0.0924, "lr": 0.2733692787682167, "epoch": 0.3764688637529622, "percentage": 19.26, "elapsed_time": "8:04:27", "remaining_time": "1 day, 9:50:33", "throughput": 336.28, "total_tokens": 9774720} {"current_steps": 7710, "total_steps": 40000, "loss": 0.073, "lr": 0.27333576297730255, "epoch": 0.3767131654166565, "percentage": 19.28, "elapsed_time": "8:04:30", "remaining_time": "1 day, 9:49:09", "throughput": 336.46, "total_tokens": 9781120} {"current_steps": 7715, "total_steps": 40000, "loss": 0.0906, "lr": 0.2733022281664638, "epoch": 0.3769574670803508, "percentage": 19.29, "elapsed_time": "8:04:33", "remaining_time": "1 day, 9:47:44", "throughput": 336.64, "total_tokens": 9787264} {"current_steps": 7720, "total_steps": 40000, "loss": 0.0764, "lr": 0.273268674340872, "epoch": 0.37720176874404515, "percentage": 19.3, "elapsed_time": "8:04:36", "remaining_time": "1 day, 9:46:18", "throughput": 336.8, "total_tokens": 9793088} {"current_steps": 7725, "total_steps": 40000, "loss": 0.0595, "lr": 0.27323510150570146, "epoch": 0.3774460704077395, "percentage": 19.31, "elapsed_time": "8:04:39", "remaining_time": "1 day, 9:44:54", "throughput": 337.01, "total_tokens": 9800064} {"current_steps": 7730, "total_steps": 40000, "loss": 0.0496, "lr": 0.27320150966612966, "epoch": 0.3776903720714338, "percentage": 19.32, "elapsed_time": "8:04:42", "remaining_time": "1 day, 9:43:30", "throughput": 337.2, "total_tokens": 9806688} {"current_steps": 7735, "total_steps": 40000, "loss": 0.0652, "lr": 0.2731678988273368, "epoch": 0.3779346737351281, "percentage": 19.34, "elapsed_time": "8:04:45", "remaining_time": "1 day, 9:42:06", "throughput": 337.38, "total_tokens": 9812960} {"current_steps": 7740, "total_steps": 40000, "loss": 0.0745, "lr": 0.27313426899450605, "epoch": 0.37817897539882245, "percentage": 19.35, "elapsed_time": "8:04:49", "remaining_time": "1 day, 9:40:41", "throughput": 337.55, "total_tokens": 9819072} {"current_steps": 7745, "total_steps": 40000, "loss": 0.0612, "lr": 0.27310062017282366, "epoch": 0.37842327706251677, "percentage": 19.36, "elapsed_time": "8:04:52", "remaining_time": "1 day, 9:39:17", "throughput": 337.73, "total_tokens": 9825312} {"current_steps": 7750, "total_steps": 40000, "loss": 0.0604, "lr": 0.2730669523674787, "epoch": 0.37866757872621115, "percentage": 19.38, "elapsed_time": "8:04:55", "remaining_time": "1 day, 9:37:53", "throughput": 337.91, "total_tokens": 9831616} {"current_steps": 7755, "total_steps": 40000, "loss": 0.0665, "lr": 0.2730332655836631, "epoch": 0.3789118803899055, "percentage": 19.39, "elapsed_time": "8:04:58", "remaining_time": "1 day, 9:36:29", "throughput": 338.09, "total_tokens": 9837792} {"current_steps": 7760, "total_steps": 40000, "loss": 0.0598, "lr": 0.2729995598265718, "epoch": 0.3791561820535998, "percentage": 19.4, "elapsed_time": "8:05:01", "remaining_time": "1 day, 9:35:05", "throughput": 338.29, "total_tokens": 9844640} {"current_steps": 7765, "total_steps": 40000, "loss": 0.0423, "lr": 0.2729658351014027, "epoch": 0.3794004837172941, "percentage": 19.41, "elapsed_time": "8:05:04", "remaining_time": "1 day, 9:33:42", "throughput": 338.49, "total_tokens": 9851552} {"current_steps": 7770, "total_steps": 40000, "loss": 0.0565, "lr": 0.27293209141335656, "epoch": 0.37964478538098845, "percentage": 19.43, "elapsed_time": "8:05:07", "remaining_time": "1 day, 9:32:18", "throughput": 338.67, "total_tokens": 9857792} {"current_steps": 7775, "total_steps": 40000, "loss": 0.055, "lr": 0.27289832876763703, "epoch": 0.37988908704468277, "percentage": 19.44, "elapsed_time": "8:05:10", "remaining_time": "1 day, 9:30:54", "throughput": 338.84, "total_tokens": 9863776} {"current_steps": 7780, "total_steps": 40000, "loss": 0.0726, "lr": 0.27286454716945074, "epoch": 0.3801333887083771, "percentage": 19.45, "elapsed_time": "8:05:13", "remaining_time": "1 day, 9:29:30", "throughput": 339.02, "total_tokens": 9869984} {"current_steps": 7785, "total_steps": 40000, "loss": 0.088, "lr": 0.27283074662400725, "epoch": 0.3803776903720714, "percentage": 19.46, "elapsed_time": "8:05:16", "remaining_time": "1 day, 9:28:07", "throughput": 339.19, "total_tokens": 9876224} {"current_steps": 7790, "total_steps": 40000, "loss": 0.0631, "lr": 0.2727969271365191, "epoch": 0.38062199203576574, "percentage": 19.48, "elapsed_time": "8:05:19", "remaining_time": "1 day, 9:26:43", "throughput": 339.37, "total_tokens": 9882304} {"current_steps": 7795, "total_steps": 40000, "loss": 0.0703, "lr": 0.2727630887122016, "epoch": 0.38086629369946007, "percentage": 19.49, "elapsed_time": "8:05:22", "remaining_time": "1 day, 9:25:20", "throughput": 339.54, "total_tokens": 9888320} {"current_steps": 7800, "total_steps": 40000, "loss": 0.0794, "lr": 0.27272923135627314, "epoch": 0.38111059536315445, "percentage": 19.5, "elapsed_time": "8:05:25", "remaining_time": "1 day, 9:23:57", "throughput": 339.72, "total_tokens": 9894624} {"current_steps": 7800, "total_steps": 40000, "eval_loss": 0.07448570430278778, "epoch": 0.38111059536315445, "percentage": 19.5, "elapsed_time": "8:16:04", "remaining_time": "1 day, 10:07:54", "throughput": 332.43, "total_tokens": 9894624} {"current_steps": 7805, "total_steps": 40000, "loss": 0.074, "lr": 0.2726953550739548, "epoch": 0.38135489702684877, "percentage": 19.51, "elapsed_time": "8:16:08", "remaining_time": "1 day, 10:06:31", "throughput": 332.6, "total_tokens": 9900800} {"current_steps": 7810, "total_steps": 40000, "loss": 0.0807, "lr": 0.27266145987047086, "epoch": 0.3815991986905431, "percentage": 19.53, "elapsed_time": "8:16:11", "remaining_time": "1 day, 10:05:07", "throughput": 332.78, "total_tokens": 9907392} {"current_steps": 7815, "total_steps": 40000, "loss": 0.0539, "lr": 0.27262754575104836, "epoch": 0.3818435003542374, "percentage": 19.54, "elapsed_time": "8:16:14", "remaining_time": "1 day, 10:03:42", "throughput": 332.97, "total_tokens": 9913920} {"current_steps": 7820, "total_steps": 40000, "loss": 0.107, "lr": 0.27259361272091726, "epoch": 0.38208780201793174, "percentage": 19.55, "elapsed_time": "8:16:17", "remaining_time": "1 day, 10:02:17", "throughput": 333.14, "total_tokens": 9920032} {"current_steps": 7825, "total_steps": 40000, "loss": 0.0938, "lr": 0.27255966078531046, "epoch": 0.38233210368162607, "percentage": 19.56, "elapsed_time": "8:16:20", "remaining_time": "1 day, 10:00:53", "throughput": 333.32, "total_tokens": 9926464} {"current_steps": 7830, "total_steps": 40000, "loss": 0.0932, "lr": 0.2725256899494638, "epoch": 0.3825764053453204, "percentage": 19.57, "elapsed_time": "8:16:23", "remaining_time": "1 day, 9:59:28", "throughput": 333.5, "total_tokens": 9932896} {"current_steps": 7835, "total_steps": 40000, "loss": 0.0583, "lr": 0.272491700218616, "epoch": 0.3828207070090147, "percentage": 19.59, "elapsed_time": "8:16:27", "remaining_time": "1 day, 9:58:04", "throughput": 333.69, "total_tokens": 9939744} {"current_steps": 7840, "total_steps": 40000, "loss": 0.1052, "lr": 0.27245769159800876, "epoch": 0.38306500867270904, "percentage": 19.6, "elapsed_time": "8:16:30", "remaining_time": "1 day, 9:56:40", "throughput": 333.87, "total_tokens": 9946048} {"current_steps": 7845, "total_steps": 40000, "loss": 0.0891, "lr": 0.2724236640928865, "epoch": 0.38330931033640336, "percentage": 19.61, "elapsed_time": "8:16:33", "remaining_time": "1 day, 9:55:16", "throughput": 334.05, "total_tokens": 9952416} {"current_steps": 7850, "total_steps": 40000, "loss": 0.0903, "lr": 0.27238961770849673, "epoch": 0.38355361200009774, "percentage": 19.62, "elapsed_time": "8:16:36", "remaining_time": "1 day, 9:53:51", "throughput": 334.22, "total_tokens": 9958656} {"current_steps": 7855, "total_steps": 40000, "loss": 0.0853, "lr": 0.27235555245008997, "epoch": 0.38379791366379207, "percentage": 19.64, "elapsed_time": "8:16:39", "remaining_time": "1 day, 9:52:27", "throughput": 334.38, "total_tokens": 9964192} {"current_steps": 7860, "total_steps": 40000, "loss": 0.0629, "lr": 0.2723214683229193, "epoch": 0.3840422153274864, "percentage": 19.65, "elapsed_time": "8:16:42", "remaining_time": "1 day, 9:51:03", "throughput": 334.56, "total_tokens": 9970496} {"current_steps": 7865, "total_steps": 40000, "loss": 0.124, "lr": 0.27228736533224107, "epoch": 0.3842865169911807, "percentage": 19.66, "elapsed_time": "8:16:45", "remaining_time": "1 day, 9:49:39", "throughput": 334.73, "total_tokens": 9976832} {"current_steps": 7870, "total_steps": 40000, "loss": 0.0862, "lr": 0.27225324348331437, "epoch": 0.38453081865487504, "percentage": 19.68, "elapsed_time": "8:16:48", "remaining_time": "1 day, 9:48:16", "throughput": 334.92, "total_tokens": 9983424} {"current_steps": 7875, "total_steps": 40000, "loss": 0.071, "lr": 0.27221910278140116, "epoch": 0.38477512031856936, "percentage": 19.69, "elapsed_time": "8:16:51", "remaining_time": "1 day, 9:46:52", "throughput": 335.1, "total_tokens": 9990016} {"current_steps": 7880, "total_steps": 40000, "loss": 0.0629, "lr": 0.2721849432317664, "epoch": 0.3850194219822637, "percentage": 19.7, "elapsed_time": "8:16:54", "remaining_time": "1 day, 9:45:29", "throughput": 335.28, "total_tokens": 9996448} {"current_steps": 7885, "total_steps": 40000, "loss": 0.068, "lr": 0.2721507648396779, "epoch": 0.385263723645958, "percentage": 19.71, "elapsed_time": "8:16:57", "remaining_time": "1 day, 9:44:06", "throughput": 335.46, "total_tokens": 10002656} {"current_steps": 7890, "total_steps": 40000, "loss": 0.0966, "lr": 0.27211656761040653, "epoch": 0.38550802530965234, "percentage": 19.73, "elapsed_time": "8:17:00", "remaining_time": "1 day, 9:42:42", "throughput": 335.64, "total_tokens": 10009088} {"current_steps": 7895, "total_steps": 40000, "loss": 0.0782, "lr": 0.2720823515492257, "epoch": 0.3857523269733467, "percentage": 19.74, "elapsed_time": "8:17:03", "remaining_time": "1 day, 9:41:19", "throughput": 335.8, "total_tokens": 10014912} {"current_steps": 7900, "total_steps": 40000, "loss": 0.0789, "lr": 0.27204811666141215, "epoch": 0.38599662863704104, "percentage": 19.75, "elapsed_time": "8:17:07", "remaining_time": "1 day, 9:39:56", "throughput": 335.98, "total_tokens": 10021216} {"current_steps": 7905, "total_steps": 40000, "loss": 0.0935, "lr": 0.2720138629522452, "epoch": 0.38624093030073536, "percentage": 19.76, "elapsed_time": "8:17:10", "remaining_time": "1 day, 9:38:33", "throughput": 336.15, "total_tokens": 10027488} {"current_steps": 7910, "total_steps": 40000, "loss": 0.0824, "lr": 0.2719795904270073, "epoch": 0.3864852319644297, "percentage": 19.78, "elapsed_time": "8:17:13", "remaining_time": "1 day, 9:37:10", "throughput": 336.33, "total_tokens": 10033856} {"current_steps": 7915, "total_steps": 40000, "loss": 0.0657, "lr": 0.2719452990909837, "epoch": 0.386729533628124, "percentage": 19.79, "elapsed_time": "8:17:16", "remaining_time": "1 day, 9:35:47", "throughput": 336.51, "total_tokens": 10040416} {"current_steps": 7920, "total_steps": 40000, "loss": 0.0555, "lr": 0.2719109889494625, "epoch": 0.38697383529181834, "percentage": 19.8, "elapsed_time": "8:17:19", "remaining_time": "1 day, 9:34:24", "throughput": 336.68, "total_tokens": 10046272} {"current_steps": 7925, "total_steps": 40000, "loss": 0.0736, "lr": 0.27187666000773475, "epoch": 0.38721813695551266, "percentage": 19.81, "elapsed_time": "8:17:22", "remaining_time": "1 day, 9:33:01", "throughput": 336.85, "total_tokens": 10052416} {"current_steps": 7930, "total_steps": 40000, "loss": 0.0615, "lr": 0.2718423122710944, "epoch": 0.387462438619207, "percentage": 19.82, "elapsed_time": "8:17:25", "remaining_time": "1 day, 9:31:39", "throughput": 337.02, "total_tokens": 10058432} {"current_steps": 7935, "total_steps": 40000, "loss": 0.0557, "lr": 0.2718079457448384, "epoch": 0.3877067402829013, "percentage": 19.84, "elapsed_time": "8:17:28", "remaining_time": "1 day, 9:30:16", "throughput": 337.2, "total_tokens": 10064992} {"current_steps": 7940, "total_steps": 40000, "loss": 0.0799, "lr": 0.27177356043426637, "epoch": 0.38795104194659563, "percentage": 19.85, "elapsed_time": "8:17:31", "remaining_time": "1 day, 9:28:54", "throughput": 337.35, "total_tokens": 10070464} {"current_steps": 7945, "total_steps": 40000, "loss": 0.081, "lr": 0.27173915634468104, "epoch": 0.38819534361029, "percentage": 19.86, "elapsed_time": "8:17:34", "remaining_time": "1 day, 9:27:31", "throughput": 337.53, "total_tokens": 10076704} {"current_steps": 7950, "total_steps": 40000, "loss": 0.0699, "lr": 0.27170473348138796, "epoch": 0.38843964527398434, "percentage": 19.88, "elapsed_time": "8:17:37", "remaining_time": "1 day, 9:26:09", "throughput": 337.71, "total_tokens": 10083104} {"current_steps": 7955, "total_steps": 40000, "loss": 0.1022, "lr": 0.27167029184969554, "epoch": 0.38868394693767866, "percentage": 19.89, "elapsed_time": "8:17:40", "remaining_time": "1 day, 9:24:47", "throughput": 337.87, "total_tokens": 10089184} {"current_steps": 7960, "total_steps": 40000, "loss": 0.0535, "lr": 0.27163583145491504, "epoch": 0.388928248601373, "percentage": 19.9, "elapsed_time": "8:17:43", "remaining_time": "1 day, 9:23:25", "throughput": 338.04, "total_tokens": 10095040} {"current_steps": 7965, "total_steps": 40000, "loss": 0.0957, "lr": 0.2716013523023608, "epoch": 0.3891725502650673, "percentage": 19.91, "elapsed_time": "8:17:46", "remaining_time": "1 day, 9:22:03", "throughput": 338.2, "total_tokens": 10100928} {"current_steps": 7970, "total_steps": 40000, "loss": 0.0635, "lr": 0.27156685439734995, "epoch": 0.38941685192876163, "percentage": 19.93, "elapsed_time": "8:17:49", "remaining_time": "1 day, 9:20:41", "throughput": 338.38, "total_tokens": 10107264} {"current_steps": 7975, "total_steps": 40000, "loss": 0.0731, "lr": 0.2715323377452024, "epoch": 0.38966115359245596, "percentage": 19.94, "elapsed_time": "8:17:52", "remaining_time": "1 day, 9:19:19", "throughput": 338.55, "total_tokens": 10113568} {"current_steps": 7980, "total_steps": 40000, "loss": 0.1001, "lr": 0.2714978023512411, "epoch": 0.3899054552561503, "percentage": 19.95, "elapsed_time": "8:17:56", "remaining_time": "1 day, 9:17:58", "throughput": 338.73, "total_tokens": 10119904} {"current_steps": 7985, "total_steps": 40000, "loss": 0.0583, "lr": 0.2714632482207918, "epoch": 0.3901497569198446, "percentage": 19.96, "elapsed_time": "8:17:59", "remaining_time": "1 day, 9:16:36", "throughput": 338.9, "total_tokens": 10126048} {"current_steps": 7990, "total_steps": 40000, "loss": 0.0689, "lr": 0.2714286753591833, "epoch": 0.3903940585835389, "percentage": 19.98, "elapsed_time": "8:18:02", "remaining_time": "1 day, 9:15:15", "throughput": 339.08, "total_tokens": 10132288} {"current_steps": 7995, "total_steps": 40000, "loss": 0.0659, "lr": 0.27139408377174706, "epoch": 0.3906383602472333, "percentage": 19.99, "elapsed_time": "8:18:05", "remaining_time": "1 day, 9:13:54", "throughput": 339.25, "total_tokens": 10138400} {"current_steps": 8000, "total_steps": 40000, "loss": 0.0653, "lr": 0.27135947346381756, "epoch": 0.39088266191092763, "percentage": 20.0, "elapsed_time": "8:18:08", "remaining_time": "1 day, 9:12:32", "throughput": 339.41, "total_tokens": 10144480} {"current_steps": 8000, "total_steps": 40000, "eval_loss": 0.07233572751283646, "epoch": 0.39088266191092763, "percentage": 20.0, "elapsed_time": "8:28:47", "remaining_time": "1 day, 9:55:08", "throughput": 332.31, "total_tokens": 10144480} {"current_steps": 8005, "total_steps": 40000, "loss": 0.0814, "lr": 0.2713248444407322, "epoch": 0.39112696357462196, "percentage": 20.01, "elapsed_time": "8:28:50", "remaining_time": "1 day, 9:53:47", "throughput": 332.47, "total_tokens": 10150432} {"current_steps": 8010, "total_steps": 40000, "loss": 0.0719, "lr": 0.27129019670783106, "epoch": 0.3913712652383163, "percentage": 20.03, "elapsed_time": "8:28:54", "remaining_time": "1 day, 9:52:25", "throughput": 332.67, "total_tokens": 10157600} {"current_steps": 8015, "total_steps": 40000, "loss": 0.0592, "lr": 0.27125553027045746, "epoch": 0.3916155669020106, "percentage": 20.04, "elapsed_time": "8:28:57", "remaining_time": "1 day, 9:51:02", "throughput": 332.85, "total_tokens": 10164384} {"current_steps": 8020, "total_steps": 40000, "loss": 0.0838, "lr": 0.2712208451339572, "epoch": 0.3918598685657049, "percentage": 20.05, "elapsed_time": "8:29:00", "remaining_time": "1 day, 9:49:39", "throughput": 333.01, "total_tokens": 10170144} {"current_steps": 8025, "total_steps": 40000, "loss": 0.0771, "lr": 0.27118614130367935, "epoch": 0.39210417022939925, "percentage": 20.06, "elapsed_time": "8:29:03", "remaining_time": "1 day, 9:48:16", "throughput": 333.16, "total_tokens": 10175872} {"current_steps": 8030, "total_steps": 40000, "loss": 0.0592, "lr": 0.2711514187849756, "epoch": 0.3923484718930936, "percentage": 20.08, "elapsed_time": "8:29:06", "remaining_time": "1 day, 9:46:54", "throughput": 333.35, "total_tokens": 10182464} {"current_steps": 8035, "total_steps": 40000, "loss": 0.0569, "lr": 0.27111667758320057, "epoch": 0.3925927735567879, "percentage": 20.09, "elapsed_time": "8:29:09", "remaining_time": "1 day, 9:45:32", "throughput": 333.53, "total_tokens": 10189056} {"current_steps": 8040, "total_steps": 40000, "loss": 0.0859, "lr": 0.27108191770371176, "epoch": 0.3928370752204823, "percentage": 20.1, "elapsed_time": "8:29:12", "remaining_time": "1 day, 9:44:10", "throughput": 333.71, "total_tokens": 10195584} {"current_steps": 8045, "total_steps": 40000, "loss": 0.0778, "lr": 0.2710471391518697, "epoch": 0.3930813768841766, "percentage": 20.11, "elapsed_time": "8:29:15", "remaining_time": "1 day, 9:42:48", "throughput": 333.9, "total_tokens": 10202496} {"current_steps": 8050, "total_steps": 40000, "loss": 0.0364, "lr": 0.2710123419330375, "epoch": 0.3933256785478709, "percentage": 20.12, "elapsed_time": "8:29:18", "remaining_time": "1 day, 9:41:26", "throughput": 334.07, "total_tokens": 10208864} {"current_steps": 8055, "total_steps": 40000, "loss": 0.05, "lr": 0.2709775260525816, "epoch": 0.39356998021156525, "percentage": 20.14, "elapsed_time": "8:29:21", "remaining_time": "1 day, 9:40:04", "throughput": 334.24, "total_tokens": 10215040} {"current_steps": 8060, "total_steps": 40000, "loss": 0.051, "lr": 0.27094269151587075, "epoch": 0.3938142818752596, "percentage": 20.15, "elapsed_time": "8:29:25", "remaining_time": "1 day, 9:38:42", "throughput": 334.42, "total_tokens": 10221664} {"current_steps": 8065, "total_steps": 40000, "loss": 0.077, "lr": 0.27090783832827703, "epoch": 0.3940585835389539, "percentage": 20.16, "elapsed_time": "8:29:28", "remaining_time": "1 day, 9:37:20", "throughput": 334.6, "total_tokens": 10228000} {"current_steps": 8070, "total_steps": 40000, "loss": 0.0602, "lr": 0.2708729664951753, "epoch": 0.3943028852026482, "percentage": 20.18, "elapsed_time": "8:29:31", "remaining_time": "1 day, 9:35:59", "throughput": 334.8, "total_tokens": 10235232} {"current_steps": 8075, "total_steps": 40000, "loss": 0.0623, "lr": 0.27083807602194304, "epoch": 0.39454718686634255, "percentage": 20.19, "elapsed_time": "8:29:34", "remaining_time": "1 day, 9:34:38", "throughput": 334.98, "total_tokens": 10241888} {"current_steps": 8080, "total_steps": 40000, "loss": 0.0721, "lr": 0.270803166913961, "epoch": 0.39479148853003687, "percentage": 20.2, "elapsed_time": "8:29:37", "remaining_time": "1 day, 9:33:17", "throughput": 335.16, "total_tokens": 10248352} {"current_steps": 8085, "total_steps": 40000, "loss": 0.0664, "lr": 0.27076823917661247, "epoch": 0.3950357901937312, "percentage": 20.21, "elapsed_time": "8:29:40", "remaining_time": "1 day, 9:31:55", "throughput": 335.33, "total_tokens": 10254560} {"current_steps": 8090, "total_steps": 40000, "loss": 0.0858, "lr": 0.2707332928152838, "epoch": 0.3952800918574256, "percentage": 20.23, "elapsed_time": "8:29:43", "remaining_time": "1 day, 9:30:34", "throughput": 335.49, "total_tokens": 10260608} {"current_steps": 8095, "total_steps": 40000, "loss": 0.0665, "lr": 0.2706983278353641, "epoch": 0.3955243935211199, "percentage": 20.24, "elapsed_time": "8:29:46", "remaining_time": "1 day, 9:29:12", "throughput": 335.66, "total_tokens": 10266720} {"current_steps": 8100, "total_steps": 40000, "loss": 0.0741, "lr": 0.27066334424224553, "epoch": 0.3957686951848142, "percentage": 20.25, "elapsed_time": "8:29:49", "remaining_time": "1 day, 9:27:51", "throughput": 335.82, "total_tokens": 10272864} {"current_steps": 8105, "total_steps": 40000, "loss": 0.0972, "lr": 0.27062834204132297, "epoch": 0.39601299684850855, "percentage": 20.26, "elapsed_time": "8:29:53", "remaining_time": "1 day, 9:26:30", "throughput": 335.99, "total_tokens": 10279008} {"current_steps": 8110, "total_steps": 40000, "loss": 0.0562, "lr": 0.27059332123799407, "epoch": 0.39625729851220287, "percentage": 20.28, "elapsed_time": "8:29:56", "remaining_time": "1 day, 9:25:09", "throughput": 336.17, "total_tokens": 10285440} {"current_steps": 8115, "total_steps": 40000, "loss": 0.0506, "lr": 0.27055828183765956, "epoch": 0.3965016001758972, "percentage": 20.29, "elapsed_time": "8:29:59", "remaining_time": "1 day, 9:23:48", "throughput": 336.35, "total_tokens": 10291968} {"current_steps": 8120, "total_steps": 40000, "loss": 0.0713, "lr": 0.270523223845723, "epoch": 0.3967459018395915, "percentage": 20.3, "elapsed_time": "8:30:02", "remaining_time": "1 day, 9:22:27", "throughput": 336.52, "total_tokens": 10298208} {"current_steps": 8125, "total_steps": 40000, "loss": 0.059, "lr": 0.2704881472675907, "epoch": 0.39699020350328584, "percentage": 20.31, "elapsed_time": "8:30:05", "remaining_time": "1 day, 9:21:07", "throughput": 336.7, "total_tokens": 10304960} {"current_steps": 8130, "total_steps": 40000, "loss": 0.0549, "lr": 0.270453052108672, "epoch": 0.39723450516698017, "percentage": 20.32, "elapsed_time": "8:30:08", "remaining_time": "1 day, 9:19:46", "throughput": 336.87, "total_tokens": 10310976} {"current_steps": 8135, "total_steps": 40000, "loss": 0.0597, "lr": 0.2704179383743789, "epoch": 0.3974788068306745, "percentage": 20.34, "elapsed_time": "8:30:11", "remaining_time": "1 day, 9:18:26", "throughput": 337.04, "total_tokens": 10317248} {"current_steps": 8140, "total_steps": 40000, "loss": 0.0396, "lr": 0.27038280607012644, "epoch": 0.39772310849436887, "percentage": 20.35, "elapsed_time": "8:30:14", "remaining_time": "1 day, 9:17:06", "throughput": 337.22, "total_tokens": 10323872} {"current_steps": 8145, "total_steps": 40000, "loss": 0.1088, "lr": 0.27034765520133247, "epoch": 0.3979674101580632, "percentage": 20.36, "elapsed_time": "8:30:17", "remaining_time": "1 day, 9:15:45", "throughput": 337.38, "total_tokens": 10329824} {"current_steps": 8150, "total_steps": 40000, "loss": 0.0502, "lr": 0.2703124857734177, "epoch": 0.3982117118217575, "percentage": 20.38, "elapsed_time": "8:30:20", "remaining_time": "1 day, 9:14:25", "throughput": 337.54, "total_tokens": 10335744} {"current_steps": 8155, "total_steps": 40000, "loss": 0.0628, "lr": 0.27027729779180565, "epoch": 0.39845601348545184, "percentage": 20.39, "elapsed_time": "8:30:23", "remaining_time": "1 day, 9:13:04", "throughput": 337.71, "total_tokens": 10341824} {"current_steps": 8160, "total_steps": 40000, "loss": 0.0646, "lr": 0.27024209126192283, "epoch": 0.39870031514914617, "percentage": 20.4, "elapsed_time": "8:30:26", "remaining_time": "1 day, 9:11:45", "throughput": 337.9, "total_tokens": 10348736} {"current_steps": 8165, "total_steps": 40000, "loss": 0.0734, "lr": 0.2702068661891984, "epoch": 0.3989446168128405, "percentage": 20.41, "elapsed_time": "8:30:30", "remaining_time": "1 day, 9:10:25", "throughput": 338.07, "total_tokens": 10355168} {"current_steps": 8170, "total_steps": 40000, "loss": 0.0727, "lr": 0.2701716225790647, "epoch": 0.3991889184765348, "percentage": 20.42, "elapsed_time": "8:30:33", "remaining_time": "1 day, 9:09:05", "throughput": 338.26, "total_tokens": 10362144} {"current_steps": 8175, "total_steps": 40000, "loss": 0.0602, "lr": 0.27013636043695655, "epoch": 0.39943322014022914, "percentage": 20.44, "elapsed_time": "8:30:36", "remaining_time": "1 day, 9:07:45", "throughput": 338.43, "total_tokens": 10368288} {"current_steps": 8180, "total_steps": 40000, "loss": 0.0861, "lr": 0.27010107976831194, "epoch": 0.39967752180392346, "percentage": 20.45, "elapsed_time": "8:30:39", "remaining_time": "1 day, 9:06:25", "throughput": 338.58, "total_tokens": 10373856} {"current_steps": 8185, "total_steps": 40000, "loss": 0.0769, "lr": 0.2700657805785715, "epoch": 0.3999218234676178, "percentage": 20.46, "elapsed_time": "8:30:42", "remaining_time": "1 day, 9:05:06", "throughput": 338.74, "total_tokens": 10379840} {"current_steps": 8190, "total_steps": 40000, "loss": 0.0464, "lr": 0.2700304628731789, "epoch": 0.40016612513131217, "percentage": 20.47, "elapsed_time": "8:30:45", "remaining_time": "1 day, 9:03:46", "throughput": 338.92, "total_tokens": 10386368} {"current_steps": 8195, "total_steps": 40000, "loss": 0.0656, "lr": 0.26999512665758046, "epoch": 0.4004104267950065, "percentage": 20.49, "elapsed_time": "8:30:48", "remaining_time": "1 day, 9:02:27", "throughput": 339.08, "total_tokens": 10392320} {"current_steps": 8200, "total_steps": 40000, "loss": 0.0635, "lr": 0.2699597719372256, "epoch": 0.4006547284587008, "percentage": 20.5, "elapsed_time": "8:30:51", "remaining_time": "1 day, 9:01:07", "throughput": 339.25, "total_tokens": 10398432} {"current_steps": 8200, "total_steps": 40000, "eval_loss": 0.07274027913808823, "epoch": 0.4006547284587008, "percentage": 20.5, "elapsed_time": "8:41:30", "remaining_time": "1 day, 9:42:26", "throughput": 332.32, "total_tokens": 10398432} {"current_steps": 8205, "total_steps": 40000, "loss": 0.0571, "lr": 0.26992439871756635, "epoch": 0.40089903012239514, "percentage": 20.51, "elapsed_time": "8:41:34", "remaining_time": "1 day, 9:41:08", "throughput": 332.49, "total_tokens": 10404992} {"current_steps": 8210, "total_steps": 40000, "loss": 0.067, "lr": 0.2698890070040578, "epoch": 0.40114333178608946, "percentage": 20.52, "elapsed_time": "8:41:37", "remaining_time": "1 day, 9:39:47", "throughput": 332.66, "total_tokens": 10411424} {"current_steps": 8215, "total_steps": 40000, "loss": 0.0551, "lr": 0.2698535968021577, "epoch": 0.4013876334497838, "percentage": 20.54, "elapsed_time": "8:41:40", "remaining_time": "1 day, 9:38:26", "throughput": 332.83, "total_tokens": 10417760} {"current_steps": 8220, "total_steps": 40000, "loss": 0.0557, "lr": 0.26981816811732684, "epoch": 0.4016319351134781, "percentage": 20.55, "elapsed_time": "8:41:43", "remaining_time": "1 day, 9:37:06", "throughput": 332.99, "total_tokens": 10423808} {"current_steps": 8225, "total_steps": 40000, "loss": 0.0607, "lr": 0.26978272095502875, "epoch": 0.40187623677717244, "percentage": 20.56, "elapsed_time": "8:41:46", "remaining_time": "1 day, 9:35:45", "throughput": 333.15, "total_tokens": 10429856} {"current_steps": 8230, "total_steps": 40000, "loss": 0.091, "lr": 0.26974725532072974, "epoch": 0.40212053844086676, "percentage": 20.57, "elapsed_time": "8:41:49", "remaining_time": "1 day, 9:34:24", "throughput": 333.31, "total_tokens": 10435872} {"current_steps": 8235, "total_steps": 40000, "loss": 0.0777, "lr": 0.26971177121989914, "epoch": 0.40236484010456114, "percentage": 20.59, "elapsed_time": "8:41:52", "remaining_time": "1 day, 9:33:03", "throughput": 333.48, "total_tokens": 10442176} {"current_steps": 8240, "total_steps": 40000, "loss": 0.0872, "lr": 0.2696762686580091, "epoch": 0.40260914176825546, "percentage": 20.6, "elapsed_time": "8:41:55", "remaining_time": "1 day, 9:31:42", "throughput": 333.63, "total_tokens": 10447776} {"current_steps": 8245, "total_steps": 40000, "loss": 0.0815, "lr": 0.26964074764053436, "epoch": 0.4028534434319498, "percentage": 20.61, "elapsed_time": "8:41:58", "remaining_time": "1 day, 9:30:22", "throughput": 333.78, "total_tokens": 10453760} {"current_steps": 8250, "total_steps": 40000, "loss": 0.0715, "lr": 0.2696052081729529, "epoch": 0.4030977450956441, "percentage": 20.62, "elapsed_time": "8:42:01", "remaining_time": "1 day, 9:29:01", "throughput": 333.96, "total_tokens": 10460128} {"current_steps": 8255, "total_steps": 40000, "loss": 0.0477, "lr": 0.2695696502607453, "epoch": 0.40334204675933844, "percentage": 20.64, "elapsed_time": "8:42:05", "remaining_time": "1 day, 9:27:41", "throughput": 334.13, "total_tokens": 10466688} {"current_steps": 8260, "total_steps": 40000, "loss": 0.0949, "lr": 0.26953407390939504, "epoch": 0.40358634842303276, "percentage": 20.65, "elapsed_time": "8:42:08", "remaining_time": "1 day, 9:26:21", "throughput": 334.3, "total_tokens": 10473088} {"current_steps": 8265, "total_steps": 40000, "loss": 0.0375, "lr": 0.26949847912438835, "epoch": 0.4038306500867271, "percentage": 20.66, "elapsed_time": "8:42:11", "remaining_time": "1 day, 9:25:01", "throughput": 334.46, "total_tokens": 10479040} {"current_steps": 8270, "total_steps": 40000, "loss": 0.0638, "lr": 0.26946286591121454, "epoch": 0.4040749517504214, "percentage": 20.67, "elapsed_time": "8:42:14", "remaining_time": "1 day, 9:23:41", "throughput": 334.62, "total_tokens": 10484896} {"current_steps": 8275, "total_steps": 40000, "loss": 0.0669, "lr": 0.2694272342753655, "epoch": 0.40431925341411573, "percentage": 20.69, "elapsed_time": "8:42:17", "remaining_time": "1 day, 9:22:21", "throughput": 334.77, "total_tokens": 10490912} {"current_steps": 8280, "total_steps": 40000, "loss": 0.0854, "lr": 0.26939158422233617, "epoch": 0.40456355507781006, "percentage": 20.7, "elapsed_time": "8:42:20", "remaining_time": "1 day, 9:21:02", "throughput": 334.95, "total_tokens": 10497536} {"current_steps": 8285, "total_steps": 40000, "loss": 0.0788, "lr": 0.26935591575762413, "epoch": 0.40480785674150443, "percentage": 20.71, "elapsed_time": "8:42:23", "remaining_time": "1 day, 9:19:42", "throughput": 335.12, "total_tokens": 10503840} {"current_steps": 8290, "total_steps": 40000, "loss": 0.0667, "lr": 0.26932022888672996, "epoch": 0.40505215840519876, "percentage": 20.72, "elapsed_time": "8:42:26", "remaining_time": "1 day, 9:18:23", "throughput": 335.29, "total_tokens": 10510240} {"current_steps": 8295, "total_steps": 40000, "loss": 0.0876, "lr": 0.26928452361515703, "epoch": 0.4052964600688931, "percentage": 20.74, "elapsed_time": "8:42:29", "remaining_time": "1 day, 9:17:03", "throughput": 335.45, "total_tokens": 10516096} {"current_steps": 8300, "total_steps": 40000, "loss": 0.0708, "lr": 0.26924879994841155, "epoch": 0.4055407617325874, "percentage": 20.75, "elapsed_time": "8:42:32", "remaining_time": "1 day, 9:15:44", "throughput": 335.61, "total_tokens": 10522272} {"current_steps": 8305, "total_steps": 40000, "loss": 0.0519, "lr": 0.2692130578920025, "epoch": 0.40578506339628173, "percentage": 20.76, "elapsed_time": "8:42:35", "remaining_time": "1 day, 9:14:25", "throughput": 335.79, "total_tokens": 10529088} {"current_steps": 8310, "total_steps": 40000, "loss": 0.0734, "lr": 0.26917729745144187, "epoch": 0.40602936505997606, "percentage": 20.77, "elapsed_time": "8:42:38", "remaining_time": "1 day, 9:13:06", "throughput": 335.96, "total_tokens": 10535424} {"current_steps": 8315, "total_steps": 40000, "loss": 0.067, "lr": 0.2691415186322443, "epoch": 0.4062736667236704, "percentage": 20.79, "elapsed_time": "8:42:41", "remaining_time": "1 day, 9:11:47", "throughput": 336.13, "total_tokens": 10541696} {"current_steps": 8320, "total_steps": 40000, "loss": 0.0968, "lr": 0.2691057214399273, "epoch": 0.4065179683873647, "percentage": 20.8, "elapsed_time": "8:42:44", "remaining_time": "1 day, 9:10:27", "throughput": 336.28, "total_tokens": 10547552} {"current_steps": 8325, "total_steps": 40000, "loss": 0.0624, "lr": 0.2690699058800113, "epoch": 0.406762270051059, "percentage": 20.81, "elapsed_time": "8:42:48", "remaining_time": "1 day, 9:09:09", "throughput": 336.46, "total_tokens": 10554240} {"current_steps": 8330, "total_steps": 40000, "loss": 0.0793, "lr": 0.2690340719580194, "epoch": 0.40700657171475335, "percentage": 20.82, "elapsed_time": "8:42:51", "remaining_time": "1 day, 9:07:50", "throughput": 336.64, "total_tokens": 10560896} {"current_steps": 8335, "total_steps": 40000, "loss": 0.0614, "lr": 0.2689982196794778, "epoch": 0.40725087337844773, "percentage": 20.84, "elapsed_time": "8:42:54", "remaining_time": "1 day, 9:06:32", "throughput": 336.8, "total_tokens": 10566944} {"current_steps": 8340, "total_steps": 40000, "loss": 0.0653, "lr": 0.2689623490499153, "epoch": 0.40749517504214205, "percentage": 20.85, "elapsed_time": "8:42:57", "remaining_time": "1 day, 9:05:13", "throughput": 336.98, "total_tokens": 10573696} {"current_steps": 8345, "total_steps": 40000, "loss": 0.0662, "lr": 0.2689264600748636, "epoch": 0.4077394767058364, "percentage": 20.86, "elapsed_time": "8:43:00", "remaining_time": "1 day, 9:03:55", "throughput": 337.15, "total_tokens": 10580000} {"current_steps": 8350, "total_steps": 40000, "loss": 0.0491, "lr": 0.26889055275985724, "epoch": 0.4079837783695307, "percentage": 20.88, "elapsed_time": "8:43:03", "remaining_time": "1 day, 9:02:36", "throughput": 337.31, "total_tokens": 10586080} {"current_steps": 8355, "total_steps": 40000, "loss": 0.0592, "lr": 0.2688546271104335, "epoch": 0.408228080033225, "percentage": 20.89, "elapsed_time": "8:43:06", "remaining_time": "1 day, 9:01:18", "throughput": 337.49, "total_tokens": 10592672} {"current_steps": 8360, "total_steps": 40000, "loss": 0.0742, "lr": 0.26881868313213275, "epoch": 0.40847238169691935, "percentage": 20.9, "elapsed_time": "8:43:09", "remaining_time": "1 day, 9:00:00", "throughput": 337.65, "total_tokens": 10598656} {"current_steps": 8365, "total_steps": 40000, "loss": 0.0878, "lr": 0.2687827208304978, "epoch": 0.4087166833606137, "percentage": 20.91, "elapsed_time": "8:43:12", "remaining_time": "1 day, 8:58:42", "throughput": 337.85, "total_tokens": 10606048} {"current_steps": 8370, "total_steps": 40000, "loss": 0.0598, "lr": 0.26874674021107464, "epoch": 0.408960985024308, "percentage": 20.93, "elapsed_time": "8:43:16", "remaining_time": "1 day, 8:57:25", "throughput": 338.03, "total_tokens": 10612832} {"current_steps": 8375, "total_steps": 40000, "loss": 0.0805, "lr": 0.2687107412794118, "epoch": 0.4092052866880023, "percentage": 20.94, "elapsed_time": "8:43:19", "remaining_time": "1 day, 8:56:07", "throughput": 338.2, "total_tokens": 10619232} {"current_steps": 8380, "total_steps": 40000, "loss": 0.0697, "lr": 0.26867472404106096, "epoch": 0.4094495883516967, "percentage": 20.95, "elapsed_time": "8:43:22", "remaining_time": "1 day, 8:54:49", "throughput": 338.37, "total_tokens": 10625568} {"current_steps": 8385, "total_steps": 40000, "loss": 0.0657, "lr": 0.26863868850157624, "epoch": 0.409693890015391, "percentage": 20.96, "elapsed_time": "8:43:25", "remaining_time": "1 day, 8:53:31", "throughput": 338.55, "total_tokens": 10632160} {"current_steps": 8390, "total_steps": 40000, "loss": 0.0616, "lr": 0.26860263466651485, "epoch": 0.40993819167908535, "percentage": 20.97, "elapsed_time": "8:43:28", "remaining_time": "1 day, 8:52:13", "throughput": 338.71, "total_tokens": 10638208} {"current_steps": 8395, "total_steps": 40000, "loss": 0.0605, "lr": 0.26856656254143674, "epoch": 0.4101824933427797, "percentage": 20.99, "elapsed_time": "8:43:31", "remaining_time": "1 day, 8:50:56", "throughput": 338.87, "total_tokens": 10644480} {"current_steps": 8400, "total_steps": 40000, "loss": 0.0769, "lr": 0.2685304721319047, "epoch": 0.410426795006474, "percentage": 21.0, "elapsed_time": "8:43:34", "remaining_time": "1 day, 8:49:38", "throughput": 339.04, "total_tokens": 10650624} {"current_steps": 8400, "total_steps": 40000, "eval_loss": 0.07526280730962753, "epoch": 0.410426795006474, "percentage": 21.0, "elapsed_time": "8:54:14", "remaining_time": "1 day, 9:29:45", "throughput": 332.27, "total_tokens": 10650624} {"current_steps": 8405, "total_steps": 40000, "loss": 0.086, "lr": 0.2684943634434843, "epoch": 0.4106710966701683, "percentage": 21.01, "elapsed_time": "8:54:18", "remaining_time": "1 day, 9:28:30", "throughput": 332.43, "total_tokens": 10657120} {"current_steps": 8410, "total_steps": 40000, "loss": 0.0815, "lr": 0.268458236481744, "epoch": 0.41091539833386265, "percentage": 21.02, "elapsed_time": "8:54:21", "remaining_time": "1 day, 9:27:11", "throughput": 332.6, "total_tokens": 10663712} {"current_steps": 8415, "total_steps": 40000, "loss": 0.074, "lr": 0.2684220912522549, "epoch": 0.41115969999755697, "percentage": 21.04, "elapsed_time": "8:54:24", "remaining_time": "1 day, 9:25:51", "throughput": 332.74, "total_tokens": 10669280} {"current_steps": 8420, "total_steps": 40000, "loss": 0.0787, "lr": 0.2683859277605913, "epoch": 0.4114040016612513, "percentage": 21.05, "elapsed_time": "8:54:27", "remaining_time": "1 day, 9:24:32", "throughput": 332.9, "total_tokens": 10675232} {"current_steps": 8425, "total_steps": 40000, "loss": 0.0716, "lr": 0.2683497460123298, "epoch": 0.4116483033249456, "percentage": 21.06, "elapsed_time": "8:54:30", "remaining_time": "1 day, 9:23:13", "throughput": 333.06, "total_tokens": 10681600} {"current_steps": 8430, "total_steps": 40000, "loss": 0.0694, "lr": 0.26831354601305013, "epoch": 0.41189260498864, "percentage": 21.07, "elapsed_time": "8:54:33", "remaining_time": "1 day, 9:21:54", "throughput": 333.22, "total_tokens": 10687520} {"current_steps": 8435, "total_steps": 40000, "loss": 0.0672, "lr": 0.26827732776833496, "epoch": 0.4121369066523343, "percentage": 21.09, "elapsed_time": "8:54:36", "remaining_time": "1 day, 9:20:36", "throughput": 333.39, "total_tokens": 10694080} {"current_steps": 8440, "total_steps": 40000, "loss": 0.0632, "lr": 0.26824109128376944, "epoch": 0.41238120831602865, "percentage": 21.1, "elapsed_time": "8:54:39", "remaining_time": "1 day, 9:19:17", "throughput": 333.55, "total_tokens": 10700224} {"current_steps": 8445, "total_steps": 40000, "loss": 0.0783, "lr": 0.2682048365649417, "epoch": 0.41262550997972297, "percentage": 21.11, "elapsed_time": "8:54:42", "remaining_time": "1 day, 9:17:58", "throughput": 333.7, "total_tokens": 10706112} {"current_steps": 8450, "total_steps": 40000, "loss": 0.0684, "lr": 0.2681685636174428, "epoch": 0.4128698116434173, "percentage": 21.12, "elapsed_time": "8:54:45", "remaining_time": "1 day, 9:16:39", "throughput": 333.88, "total_tokens": 10712704} {"current_steps": 8455, "total_steps": 40000, "loss": 0.0727, "lr": 0.2681322724468663, "epoch": 0.4131141133071116, "percentage": 21.14, "elapsed_time": "8:54:48", "remaining_time": "1 day, 9:15:21", "throughput": 334.04, "total_tokens": 10719072} {"current_steps": 8460, "total_steps": 40000, "loss": 0.0754, "lr": 0.2680959630588089, "epoch": 0.41335841497080594, "percentage": 21.15, "elapsed_time": "8:54:52", "remaining_time": "1 day, 9:14:03", "throughput": 334.21, "total_tokens": 10725536} {"current_steps": 8465, "total_steps": 40000, "loss": 0.0732, "lr": 0.26805963545886985, "epoch": 0.41360271663450027, "percentage": 21.16, "elapsed_time": "8:54:55", "remaining_time": "1 day, 9:12:45", "throughput": 334.38, "total_tokens": 10732032} {"current_steps": 8470, "total_steps": 40000, "loss": 0.0688, "lr": 0.26802328965265143, "epoch": 0.4138470182981946, "percentage": 21.18, "elapsed_time": "8:54:58", "remaining_time": "1 day, 9:11:27", "throughput": 334.56, "total_tokens": 10738688} {"current_steps": 8475, "total_steps": 40000, "loss": 0.0672, "lr": 0.26798692564575854, "epoch": 0.4140913199618889, "percentage": 21.19, "elapsed_time": "8:55:01", "remaining_time": "1 day, 9:10:09", "throughput": 334.71, "total_tokens": 10744640} {"current_steps": 8480, "total_steps": 40000, "loss": 0.0831, "lr": 0.26795054344379904, "epoch": 0.4143356216255833, "percentage": 21.2, "elapsed_time": "8:55:04", "remaining_time": "1 day, 9:08:51", "throughput": 334.87, "total_tokens": 10750912} {"current_steps": 8485, "total_steps": 40000, "loss": 0.0667, "lr": 0.2679141430523835, "epoch": 0.4145799232892776, "percentage": 21.21, "elapsed_time": "8:55:07", "remaining_time": "1 day, 9:07:33", "throughput": 335.03, "total_tokens": 10756960} {"current_steps": 8490, "total_steps": 40000, "loss": 0.0832, "lr": 0.2678777244771252, "epoch": 0.41482422495297194, "percentage": 21.22, "elapsed_time": "8:55:10", "remaining_time": "1 day, 9:06:15", "throughput": 335.19, "total_tokens": 10763168} {"current_steps": 8495, "total_steps": 40000, "loss": 0.1004, "lr": 0.2678412877236405, "epoch": 0.41506852661666627, "percentage": 21.24, "elapsed_time": "8:55:13", "remaining_time": "1 day, 9:04:58", "throughput": 335.36, "total_tokens": 10769504} {"current_steps": 8500, "total_steps": 40000, "loss": 0.0822, "lr": 0.2678048327975484, "epoch": 0.4153128282803606, "percentage": 21.25, "elapsed_time": "8:55:16", "remaining_time": "1 day, 9:03:40", "throughput": 335.53, "total_tokens": 10776160} {"current_steps": 8505, "total_steps": 40000, "loss": 0.0587, "lr": 0.2677683597044706, "epoch": 0.4155571299440549, "percentage": 21.26, "elapsed_time": "8:55:19", "remaining_time": "1 day, 9:02:23", "throughput": 335.7, "total_tokens": 10782688} {"current_steps": 8510, "total_steps": 40000, "loss": 0.0885, "lr": 0.2677318684500318, "epoch": 0.41580143160774924, "percentage": 21.27, "elapsed_time": "8:55:22", "remaining_time": "1 day, 9:01:06", "throughput": 335.85, "total_tokens": 10788576} {"current_steps": 8515, "total_steps": 40000, "loss": 0.0685, "lr": 0.2676953590398593, "epoch": 0.41604573327144356, "percentage": 21.29, "elapsed_time": "8:55:25", "remaining_time": "1 day, 8:59:48", "throughput": 336.02, "total_tokens": 10794848} {"current_steps": 8520, "total_steps": 40000, "loss": 0.0694, "lr": 0.2676588314795834, "epoch": 0.4162900349351379, "percentage": 21.3, "elapsed_time": "8:55:29", "remaining_time": "1 day, 8:58:31", "throughput": 336.19, "total_tokens": 10801504} {"current_steps": 8525, "total_steps": 40000, "loss": 0.0945, "lr": 0.26762228577483715, "epoch": 0.4165343365988322, "percentage": 21.31, "elapsed_time": "8:55:32", "remaining_time": "1 day, 8:57:14", "throughput": 336.35, "total_tokens": 10807488} {"current_steps": 8530, "total_steps": 40000, "loss": 0.0519, "lr": 0.2675857219312563, "epoch": 0.4167786382625266, "percentage": 21.32, "elapsed_time": "8:55:35", "remaining_time": "1 day, 8:55:57", "throughput": 336.52, "total_tokens": 10814240} {"current_steps": 8535, "total_steps": 40000, "loss": 0.0449, "lr": 0.2675491399544794, "epoch": 0.4170229399262209, "percentage": 21.34, "elapsed_time": "8:55:38", "remaining_time": "1 day, 8:54:40", "throughput": 336.69, "total_tokens": 10820640} {"current_steps": 8540, "total_steps": 40000, "loss": 0.0695, "lr": 0.2675125398501479, "epoch": 0.41726724158991524, "percentage": 21.35, "elapsed_time": "8:55:41", "remaining_time": "1 day, 8:53:23", "throughput": 336.85, "total_tokens": 10826848} {"current_steps": 8545, "total_steps": 40000, "loss": 0.0696, "lr": 0.26747592162390604, "epoch": 0.41751154325360956, "percentage": 21.36, "elapsed_time": "8:55:44", "remaining_time": "1 day, 8:52:06", "throughput": 337.01, "total_tokens": 10832896} {"current_steps": 8550, "total_steps": 40000, "loss": 0.0528, "lr": 0.26743928528140076, "epoch": 0.4177558449173039, "percentage": 21.38, "elapsed_time": "8:55:47", "remaining_time": "1 day, 8:50:50", "throughput": 337.18, "total_tokens": 10839360} {"current_steps": 8555, "total_steps": 40000, "loss": 0.0799, "lr": 0.26740263082828186, "epoch": 0.4180001465809982, "percentage": 21.39, "elapsed_time": "8:55:50", "remaining_time": "1 day, 8:49:33", "throughput": 337.33, "total_tokens": 10845472} {"current_steps": 8560, "total_steps": 40000, "loss": 0.0681, "lr": 0.2673659582702019, "epoch": 0.41824444824469253, "percentage": 21.4, "elapsed_time": "8:55:53", "remaining_time": "1 day, 8:48:16", "throughput": 337.49, "total_tokens": 10851424} {"current_steps": 8565, "total_steps": 40000, "loss": 0.0507, "lr": 0.2673292676128163, "epoch": 0.41848874990838686, "percentage": 21.41, "elapsed_time": "8:55:56", "remaining_time": "1 day, 8:47:00", "throughput": 337.65, "total_tokens": 10857632} {"current_steps": 8570, "total_steps": 40000, "loss": 0.0629, "lr": 0.2672925588617831, "epoch": 0.4187330515720812, "percentage": 21.43, "elapsed_time": "8:55:59", "remaining_time": "1 day, 8:45:44", "throughput": 337.83, "total_tokens": 10864512} {"current_steps": 8575, "total_steps": 40000, "loss": 0.0506, "lr": 0.2672558320227634, "epoch": 0.41897735323577556, "percentage": 21.44, "elapsed_time": "8:56:02", "remaining_time": "1 day, 8:44:28", "throughput": 337.99, "total_tokens": 10870816} {"current_steps": 8580, "total_steps": 40000, "loss": 0.0763, "lr": 0.2672190871014209, "epoch": 0.4192216548994699, "percentage": 21.45, "elapsed_time": "8:56:06", "remaining_time": "1 day, 8:43:12", "throughput": 338.16, "total_tokens": 10877152} {"current_steps": 8585, "total_steps": 40000, "loss": 0.0571, "lr": 0.267182324103422, "epoch": 0.4194659565631642, "percentage": 21.46, "elapsed_time": "8:56:09", "remaining_time": "1 day, 8:41:56", "throughput": 338.32, "total_tokens": 10883552} {"current_steps": 8590, "total_steps": 40000, "loss": 0.0785, "lr": 0.2671455430344362, "epoch": 0.41971025822685853, "percentage": 21.48, "elapsed_time": "8:56:12", "remaining_time": "1 day, 8:40:40", "throughput": 338.48, "total_tokens": 10889760} {"current_steps": 8595, "total_steps": 40000, "loss": 0.057, "lr": 0.2671087439001355, "epoch": 0.41995455989055286, "percentage": 21.49, "elapsed_time": "8:56:15", "remaining_time": "1 day, 8:39:23", "throughput": 338.64, "total_tokens": 10895808} {"current_steps": 8600, "total_steps": 40000, "loss": 0.0831, "lr": 0.2670719267061948, "epoch": 0.4201988615542472, "percentage": 21.5, "elapsed_time": "8:56:18", "remaining_time": "1 day, 8:38:07", "throughput": 338.8, "total_tokens": 10901824} {"current_steps": 8600, "total_steps": 40000, "eval_loss": 0.07164221256971359, "epoch": 0.4201988615542472, "percentage": 21.5, "elapsed_time": "9:06:58", "remaining_time": "1 day, 9:17:04", "throughput": 332.19, "total_tokens": 10901824} {"current_steps": 8605, "total_steps": 40000, "loss": 0.031, "lr": 0.2670350914582918, "epoch": 0.4204431632179415, "percentage": 21.51, "elapsed_time": "9:07:02", "remaining_time": "1 day, 9:15:49", "throughput": 332.34, "total_tokens": 10908096} {"current_steps": 8610, "total_steps": 40000, "loss": 0.0616, "lr": 0.26699823816210694, "epoch": 0.42068746488163583, "percentage": 21.52, "elapsed_time": "9:07:05", "remaining_time": "1 day, 9:14:32", "throughput": 332.49, "total_tokens": 10914112} {"current_steps": 8615, "total_steps": 40000, "loss": 0.1017, "lr": 0.26696136682332344, "epoch": 0.42093176654533015, "percentage": 21.54, "elapsed_time": "9:07:08", "remaining_time": "1 day, 9:13:14", "throughput": 332.67, "total_tokens": 10920896} {"current_steps": 8620, "total_steps": 40000, "loss": 0.0779, "lr": 0.2669244774476274, "epoch": 0.4211760682090245, "percentage": 21.55, "elapsed_time": "9:07:11", "remaining_time": "1 day, 9:11:57", "throughput": 332.83, "total_tokens": 10927296} {"current_steps": 8625, "total_steps": 40000, "loss": 0.0882, "lr": 0.2668875700407075, "epoch": 0.42142036987271886, "percentage": 21.56, "elapsed_time": "9:07:14", "remaining_time": "1 day, 9:10:40", "throughput": 333.0, "total_tokens": 10933696} {"current_steps": 8630, "total_steps": 40000, "loss": 0.0904, "lr": 0.26685064460825547, "epoch": 0.4216646715364132, "percentage": 21.57, "elapsed_time": "9:07:17", "remaining_time": "1 day, 9:09:23", "throughput": 333.15, "total_tokens": 10939776} {"current_steps": 8635, "total_steps": 40000, "loss": 0.0609, "lr": 0.26681370115596553, "epoch": 0.4219089732001075, "percentage": 21.59, "elapsed_time": "9:07:20", "remaining_time": "1 day, 9:08:06", "throughput": 333.3, "total_tokens": 10945760} {"current_steps": 8640, "total_steps": 40000, "loss": 0.0639, "lr": 0.26677673968953497, "epoch": 0.42215327486380183, "percentage": 21.6, "elapsed_time": "9:07:23", "remaining_time": "1 day, 9:06:48", "throughput": 333.46, "total_tokens": 10951840} {"current_steps": 8645, "total_steps": 40000, "loss": 0.0603, "lr": 0.2667397602146636, "epoch": 0.42239757652749615, "percentage": 21.61, "elapsed_time": "9:07:26", "remaining_time": "1 day, 9:05:32", "throughput": 333.62, "total_tokens": 10958272} {"current_steps": 8650, "total_steps": 40000, "loss": 0.0615, "lr": 0.2667027627370542, "epoch": 0.4226418781911905, "percentage": 21.62, "elapsed_time": "9:07:29", "remaining_time": "1 day, 9:04:15", "throughput": 333.78, "total_tokens": 10964480} {"current_steps": 8655, "total_steps": 40000, "loss": 0.0734, "lr": 0.26666574726241216, "epoch": 0.4228861798548848, "percentage": 21.64, "elapsed_time": "9:07:32", "remaining_time": "1 day, 9:02:59", "throughput": 333.95, "total_tokens": 10970976} {"current_steps": 8660, "total_steps": 40000, "loss": 0.0995, "lr": 0.2666287137964458, "epoch": 0.4231304815185791, "percentage": 21.65, "elapsed_time": "9:07:35", "remaining_time": "1 day, 9:01:42", "throughput": 334.1, "total_tokens": 10976960} {"current_steps": 8665, "total_steps": 40000, "loss": 0.0853, "lr": 0.26659166234486614, "epoch": 0.42337478318227345, "percentage": 21.66, "elapsed_time": "9:07:38", "remaining_time": "1 day, 9:00:25", "throughput": 334.25, "total_tokens": 10982912} {"current_steps": 8670, "total_steps": 40000, "loss": 0.0857, "lr": 0.2665545929133869, "epoch": 0.4236190848459678, "percentage": 21.68, "elapsed_time": "9:07:41", "remaining_time": "1 day, 8:59:09", "throughput": 334.42, "total_tokens": 10989472} {"current_steps": 8675, "total_steps": 40000, "loss": 0.0791, "lr": 0.2665175055077248, "epoch": 0.42386338650966215, "percentage": 21.69, "elapsed_time": "9:07:44", "remaining_time": "1 day, 8:57:53", "throughput": 334.58, "total_tokens": 10995904} {"current_steps": 8680, "total_steps": 40000, "loss": 0.0728, "lr": 0.2664804001335991, "epoch": 0.4241076881733565, "percentage": 21.7, "elapsed_time": "9:07:48", "remaining_time": "1 day, 8:56:37", "throughput": 334.76, "total_tokens": 11002784} {"current_steps": 8685, "total_steps": 40000, "loss": 0.0465, "lr": 0.26644327679673185, "epoch": 0.4243519898370508, "percentage": 21.71, "elapsed_time": "9:07:51", "remaining_time": "1 day, 8:55:21", "throughput": 334.93, "total_tokens": 11009568} {"current_steps": 8690, "total_steps": 40000, "loss": 0.0608, "lr": 0.26640613550284803, "epoch": 0.4245962915007451, "percentage": 21.73, "elapsed_time": "9:07:54", "remaining_time": "1 day, 8:54:06", "throughput": 335.1, "total_tokens": 11016288} {"current_steps": 8695, "total_steps": 40000, "loss": 0.0775, "lr": 0.26636897625767525, "epoch": 0.42484059316443945, "percentage": 21.74, "elapsed_time": "9:07:57", "remaining_time": "1 day, 8:52:50", "throughput": 335.27, "total_tokens": 11022880} {"current_steps": 8700, "total_steps": 40000, "loss": 0.0755, "lr": 0.266331799066944, "epoch": 0.4250848948281338, "percentage": 21.75, "elapsed_time": "9:08:00", "remaining_time": "1 day, 8:51:34", "throughput": 335.42, "total_tokens": 11028704} {"current_steps": 8705, "total_steps": 40000, "loss": 0.069, "lr": 0.2662946039363874, "epoch": 0.4253291964918281, "percentage": 21.76, "elapsed_time": "9:08:03", "remaining_time": "1 day, 8:50:18", "throughput": 335.57, "total_tokens": 11034656} {"current_steps": 8710, "total_steps": 40000, "loss": 0.0492, "lr": 0.2662573908717414, "epoch": 0.4255734981555224, "percentage": 21.77, "elapsed_time": "9:08:06", "remaining_time": "1 day, 8:49:02", "throughput": 335.72, "total_tokens": 11040768} {"current_steps": 8715, "total_steps": 40000, "loss": 0.0816, "lr": 0.2662201598787447, "epoch": 0.42581779981921675, "percentage": 21.79, "elapsed_time": "9:08:09", "remaining_time": "1 day, 8:47:46", "throughput": 335.88, "total_tokens": 11046976} {"current_steps": 8720, "total_steps": 40000, "loss": 0.0903, "lr": 0.2661829109631389, "epoch": 0.42606210148291107, "percentage": 21.8, "elapsed_time": "9:08:12", "remaining_time": "1 day, 8:46:31", "throughput": 336.04, "total_tokens": 11053408} {"current_steps": 8725, "total_steps": 40000, "loss": 0.0516, "lr": 0.26614564413066816, "epoch": 0.42630640314660545, "percentage": 21.81, "elapsed_time": "9:08:15", "remaining_time": "1 day, 8:45:15", "throughput": 336.21, "total_tokens": 11059776} {"current_steps": 8730, "total_steps": 40000, "loss": 0.0691, "lr": 0.2661083593870795, "epoch": 0.4265507048102998, "percentage": 21.82, "elapsed_time": "9:08:18", "remaining_time": "1 day, 8:44:00", "throughput": 336.35, "total_tokens": 11065664} {"current_steps": 8735, "total_steps": 40000, "loss": 0.0521, "lr": 0.26607105673812276, "epoch": 0.4267950064739941, "percentage": 21.84, "elapsed_time": "9:08:21", "remaining_time": "1 day, 8:42:44", "throughput": 336.52, "total_tokens": 11072032} {"current_steps": 8740, "total_steps": 40000, "loss": 0.0569, "lr": 0.2660337361895504, "epoch": 0.4270393081376884, "percentage": 21.85, "elapsed_time": "9:08:24", "remaining_time": "1 day, 8:41:29", "throughput": 336.67, "total_tokens": 11078208} {"current_steps": 8745, "total_steps": 40000, "loss": 0.0396, "lr": 0.26599639774711775, "epoch": 0.42728360980138275, "percentage": 21.86, "elapsed_time": "9:08:28", "remaining_time": "1 day, 8:40:14", "throughput": 336.83, "total_tokens": 11084544} {"current_steps": 8750, "total_steps": 40000, "loss": 0.0483, "lr": 0.2659590414165829, "epoch": 0.42752791146507707, "percentage": 21.88, "elapsed_time": "9:08:31", "remaining_time": "1 day, 8:38:59", "throughput": 336.99, "total_tokens": 11090848} {"current_steps": 8755, "total_steps": 40000, "loss": 0.0549, "lr": 0.2659216672037066, "epoch": 0.4277722131287714, "percentage": 21.89, "elapsed_time": "9:08:34", "remaining_time": "1 day, 8:37:44", "throughput": 337.16, "total_tokens": 11097280} {"current_steps": 8760, "total_steps": 40000, "loss": 0.0526, "lr": 0.26588427511425244, "epoch": 0.4280165147924657, "percentage": 21.9, "elapsed_time": "9:08:37", "remaining_time": "1 day, 8:36:29", "throughput": 337.32, "total_tokens": 11103712} {"current_steps": 8765, "total_steps": 40000, "loss": 0.0629, "lr": 0.26584686515398676, "epoch": 0.42826081645616004, "percentage": 21.91, "elapsed_time": "9:08:40", "remaining_time": "1 day, 8:35:15", "throughput": 337.49, "total_tokens": 11110144} {"current_steps": 8770, "total_steps": 40000, "loss": 0.1108, "lr": 0.2658094373286787, "epoch": 0.4285051181198544, "percentage": 21.93, "elapsed_time": "9:08:43", "remaining_time": "1 day, 8:34:00", "throughput": 337.64, "total_tokens": 11116128} {"current_steps": 8775, "total_steps": 40000, "loss": 0.0572, "lr": 0.2657719916441, "epoch": 0.42874941978354875, "percentage": 21.94, "elapsed_time": "9:08:46", "remaining_time": "1 day, 8:32:45", "throughput": 337.81, "total_tokens": 11122816} {"current_steps": 8780, "total_steps": 40000, "loss": 0.0825, "lr": 0.2657345281060253, "epoch": 0.42899372144724307, "percentage": 21.95, "elapsed_time": "9:08:49", "remaining_time": "1 day, 8:31:31", "throughput": 337.98, "total_tokens": 11129568} {"current_steps": 8785, "total_steps": 40000, "loss": 0.0803, "lr": 0.26569704672023203, "epoch": 0.4292380231109374, "percentage": 21.96, "elapsed_time": "9:08:52", "remaining_time": "1 day, 8:30:16", "throughput": 338.13, "total_tokens": 11135584} {"current_steps": 8790, "total_steps": 40000, "loss": 0.0363, "lr": 0.26565954749250015, "epoch": 0.4294823247746317, "percentage": 21.98, "elapsed_time": "9:08:56", "remaining_time": "1 day, 8:29:03", "throughput": 338.33, "total_tokens": 11143232} {"current_steps": 8795, "total_steps": 40000, "loss": 0.0767, "lr": 0.2656220304286126, "epoch": 0.42972662643832604, "percentage": 21.99, "elapsed_time": "9:08:59", "remaining_time": "1 day, 8:27:49", "throughput": 338.5, "total_tokens": 11149856} {"current_steps": 8800, "total_steps": 40000, "loss": 0.0868, "lr": 0.265584495534355, "epoch": 0.42997092810202037, "percentage": 22.0, "elapsed_time": "9:09:02", "remaining_time": "1 day, 8:26:35", "throughput": 338.65, "total_tokens": 11155840} {"current_steps": 8800, "total_steps": 40000, "eval_loss": 0.0719369500875473, "epoch": 0.42997092810202037, "percentage": 22.0, "elapsed_time": "9:19:41", "remaining_time": "1 day, 9:04:20", "throughput": 332.21, "total_tokens": 11155840} {"current_steps": 8805, "total_steps": 40000, "loss": 0.0421, "lr": 0.2655469428155156, "epoch": 0.4302152297657147, "percentage": 22.01, "elapsed_time": "9:19:44", "remaining_time": "1 day, 9:03:06", "throughput": 332.36, "total_tokens": 11162368} {"current_steps": 8810, "total_steps": 40000, "loss": 0.0687, "lr": 0.2655093722778856, "epoch": 0.430459531429409, "percentage": 22.02, "elapsed_time": "9:19:47", "remaining_time": "1 day, 9:01:51", "throughput": 332.53, "total_tokens": 11168832} {"current_steps": 8815, "total_steps": 40000, "loss": 0.0872, "lr": 0.2654717839272588, "epoch": 0.43070383309310334, "percentage": 22.04, "elapsed_time": "9:19:50", "remaining_time": "1 day, 9:00:35", "throughput": 332.68, "total_tokens": 11174976} {"current_steps": 8820, "total_steps": 40000, "loss": 0.0744, "lr": 0.2654341777694318, "epoch": 0.4309481347567977, "percentage": 22.05, "elapsed_time": "9:19:53", "remaining_time": "1 day, 8:59:19", "throughput": 332.83, "total_tokens": 11181216} {"current_steps": 8825, "total_steps": 40000, "loss": 0.0678, "lr": 0.265396553810204, "epoch": 0.43119243642049204, "percentage": 22.06, "elapsed_time": "9:19:57", "remaining_time": "1 day, 8:58:04", "throughput": 333.01, "total_tokens": 11188064} {"current_steps": 8830, "total_steps": 40000, "loss": 0.0623, "lr": 0.26535891205537737, "epoch": 0.43143673808418637, "percentage": 22.07, "elapsed_time": "9:20:00", "remaining_time": "1 day, 8:56:48", "throughput": 333.15, "total_tokens": 11193920} {"current_steps": 8835, "total_steps": 40000, "loss": 0.0694, "lr": 0.26532125251075683, "epoch": 0.4316810397478807, "percentage": 22.09, "elapsed_time": "9:20:03", "remaining_time": "1 day, 8:55:33", "throughput": 333.31, "total_tokens": 11200416} {"current_steps": 8840, "total_steps": 40000, "loss": 0.0743, "lr": 0.26528357518214996, "epoch": 0.431925341411575, "percentage": 22.1, "elapsed_time": "9:20:06", "remaining_time": "1 day, 8:54:18", "throughput": 333.48, "total_tokens": 11206880} {"current_steps": 8845, "total_steps": 40000, "loss": 0.0817, "lr": 0.26524588007536704, "epoch": 0.43216964307526934, "percentage": 22.11, "elapsed_time": "9:20:09", "remaining_time": "1 day, 8:53:03", "throughput": 333.64, "total_tokens": 11213376} {"current_steps": 8850, "total_steps": 40000, "loss": 0.0929, "lr": 0.26520816719622115, "epoch": 0.43241394473896366, "percentage": 22.12, "elapsed_time": "9:20:12", "remaining_time": "1 day, 8:51:48", "throughput": 333.8, "total_tokens": 11219840} {"current_steps": 8855, "total_steps": 40000, "loss": 0.0708, "lr": 0.2651704365505281, "epoch": 0.432658246402658, "percentage": 22.14, "elapsed_time": "9:20:15", "remaining_time": "1 day, 8:50:33", "throughput": 333.97, "total_tokens": 11226592} {"current_steps": 8860, "total_steps": 40000, "loss": 0.081, "lr": 0.26513268814410634, "epoch": 0.4329025480663523, "percentage": 22.15, "elapsed_time": "9:20:18", "remaining_time": "1 day, 8:49:18", "throughput": 334.13, "total_tokens": 11232928} {"current_steps": 8865, "total_steps": 40000, "loss": 0.0986, "lr": 0.2650949219827773, "epoch": 0.43314684973004663, "percentage": 22.16, "elapsed_time": "9:20:21", "remaining_time": "1 day, 8:48:04", "throughput": 334.29, "total_tokens": 11239456} {"current_steps": 8870, "total_steps": 40000, "loss": 0.0851, "lr": 0.26505713807236486, "epoch": 0.433391151393741, "percentage": 22.18, "elapsed_time": "9:20:25", "remaining_time": "1 day, 8:46:49", "throughput": 334.45, "total_tokens": 11246048} {"current_steps": 8875, "total_steps": 40000, "loss": 0.0675, "lr": 0.26501933641869585, "epoch": 0.43363545305743534, "percentage": 22.19, "elapsed_time": "9:20:28", "remaining_time": "1 day, 8:45:35", "throughput": 334.62, "total_tokens": 11252512} {"current_steps": 8880, "total_steps": 40000, "loss": 0.0376, "lr": 0.26498151702759976, "epoch": 0.43387975472112966, "percentage": 22.2, "elapsed_time": "9:20:31", "remaining_time": "1 day, 8:44:21", "throughput": 334.78, "total_tokens": 11259136} {"current_steps": 8885, "total_steps": 40000, "loss": 0.0691, "lr": 0.2649436799049088, "epoch": 0.434124056384824, "percentage": 22.21, "elapsed_time": "9:20:34", "remaining_time": "1 day, 8:43:06", "throughput": 334.93, "total_tokens": 11265184} {"current_steps": 8890, "total_steps": 40000, "loss": 0.054, "lr": 0.2649058250564579, "epoch": 0.4343683580485183, "percentage": 22.23, "elapsed_time": "9:20:37", "remaining_time": "1 day, 8:41:52", "throughput": 335.08, "total_tokens": 11271328} {"current_steps": 8895, "total_steps": 40000, "loss": 0.0721, "lr": 0.26486795248808476, "epoch": 0.43461265971221263, "percentage": 22.24, "elapsed_time": "9:20:40", "remaining_time": "1 day, 8:40:38", "throughput": 335.26, "total_tokens": 11278400} {"current_steps": 8900, "total_steps": 40000, "loss": 0.0873, "lr": 0.2648300622056298, "epoch": 0.43485696137590696, "percentage": 22.25, "elapsed_time": "9:20:43", "remaining_time": "1 day, 8:39:24", "throughput": 335.43, "total_tokens": 11285088} {"current_steps": 8905, "total_steps": 40000, "loss": 0.0593, "lr": 0.2647921542149363, "epoch": 0.4351012630396013, "percentage": 22.26, "elapsed_time": "9:20:46", "remaining_time": "1 day, 8:38:10", "throughput": 335.58, "total_tokens": 11291328} {"current_steps": 8910, "total_steps": 40000, "loss": 0.1208, "lr": 0.26475422852185, "epoch": 0.4353455647032956, "percentage": 22.27, "elapsed_time": "9:20:50", "remaining_time": "1 day, 8:36:56", "throughput": 335.75, "total_tokens": 11297984} {"current_steps": 8915, "total_steps": 40000, "loss": 0.0739, "lr": 0.2647162851322196, "epoch": 0.43558986636699, "percentage": 22.29, "elapsed_time": "9:20:53", "remaining_time": "1 day, 8:35:42", "throughput": 335.9, "total_tokens": 11304192} {"current_steps": 8920, "total_steps": 40000, "loss": 0.0845, "lr": 0.2646783240518964, "epoch": 0.4358341680306843, "percentage": 22.3, "elapsed_time": "9:20:56", "remaining_time": "1 day, 8:34:28", "throughput": 336.05, "total_tokens": 11310176} {"current_steps": 8925, "total_steps": 40000, "loss": 0.0787, "lr": 0.26464034528673447, "epoch": 0.43607846969437863, "percentage": 22.31, "elapsed_time": "9:20:59", "remaining_time": "1 day, 8:33:14", "throughput": 336.22, "total_tokens": 11317056} {"current_steps": 8930, "total_steps": 40000, "loss": 0.0573, "lr": 0.26460234884259065, "epoch": 0.43632277135807296, "percentage": 22.32, "elapsed_time": "9:21:02", "remaining_time": "1 day, 8:32:01", "throughput": 336.38, "total_tokens": 11323296} {"current_steps": 8935, "total_steps": 40000, "loss": 0.0798, "lr": 0.2645643347253245, "epoch": 0.4365670730217673, "percentage": 22.34, "elapsed_time": "9:21:05", "remaining_time": "1 day, 8:30:47", "throughput": 336.55, "total_tokens": 11330208} {"current_steps": 8940, "total_steps": 40000, "loss": 0.0684, "lr": 0.2645263029407982, "epoch": 0.4368113746854616, "percentage": 22.35, "elapsed_time": "9:21:08", "remaining_time": "1 day, 8:29:34", "throughput": 336.7, "total_tokens": 11336224} {"current_steps": 8945, "total_steps": 40000, "loss": 0.0599, "lr": 0.2644882534948767, "epoch": 0.43705567634915593, "percentage": 22.36, "elapsed_time": "9:21:11", "remaining_time": "1 day, 8:28:20", "throughput": 336.87, "total_tokens": 11342848} {"current_steps": 8950, "total_steps": 40000, "loss": 0.0948, "lr": 0.2644501863934278, "epoch": 0.43729997801285025, "percentage": 22.38, "elapsed_time": "9:21:14", "remaining_time": "1 day, 8:27:06", "throughput": 337.01, "total_tokens": 11348736} {"current_steps": 8955, "total_steps": 40000, "loss": 0.0542, "lr": 0.26441210164232193, "epoch": 0.4375442796765446, "percentage": 22.39, "elapsed_time": "9:21:17", "remaining_time": "1 day, 8:25:53", "throughput": 337.17, "total_tokens": 11355264} {"current_steps": 8960, "total_steps": 40000, "loss": 0.0848, "lr": 0.26437399924743216, "epoch": 0.4377885813402389, "percentage": 22.4, "elapsed_time": "9:21:20", "remaining_time": "1 day, 8:24:40", "throughput": 337.34, "total_tokens": 11361856} {"current_steps": 8965, "total_steps": 40000, "loss": 0.0705, "lr": 0.26433587921463436, "epoch": 0.4380328830039333, "percentage": 22.41, "elapsed_time": "9:21:24", "remaining_time": "1 day, 8:23:27", "throughput": 337.5, "total_tokens": 11368288} {"current_steps": 8970, "total_steps": 40000, "loss": 0.0718, "lr": 0.2642977415498072, "epoch": 0.4382771846676276, "percentage": 22.43, "elapsed_time": "9:21:27", "remaining_time": "1 day, 8:22:14", "throughput": 337.65, "total_tokens": 11374528} {"current_steps": 8975, "total_steps": 40000, "loss": 0.0746, "lr": 0.26425958625883195, "epoch": 0.43852148633132193, "percentage": 22.44, "elapsed_time": "9:21:30", "remaining_time": "1 day, 8:21:01", "throughput": 337.82, "total_tokens": 11381376} {"current_steps": 8980, "total_steps": 40000, "loss": 0.0569, "lr": 0.2642214133475926, "epoch": 0.43876578799501625, "percentage": 22.45, "elapsed_time": "9:21:33", "remaining_time": "1 day, 8:19:49", "throughput": 338.0, "total_tokens": 11388256} {"current_steps": 8985, "total_steps": 40000, "loss": 0.0544, "lr": 0.26418322282197587, "epoch": 0.4390100896587106, "percentage": 22.46, "elapsed_time": "9:21:36", "remaining_time": "1 day, 8:18:36", "throughput": 338.16, "total_tokens": 11394752} {"current_steps": 8990, "total_steps": 40000, "loss": 0.0692, "lr": 0.2641450146878714, "epoch": 0.4392543913224049, "percentage": 22.48, "elapsed_time": "9:21:39", "remaining_time": "1 day, 8:17:23", "throughput": 338.3, "total_tokens": 11400704} {"current_steps": 8995, "total_steps": 40000, "loss": 0.0733, "lr": 0.26410678895117107, "epoch": 0.4394986929860992, "percentage": 22.49, "elapsed_time": "9:21:42", "remaining_time": "1 day, 8:16:10", "throughput": 338.45, "total_tokens": 11406848} {"current_steps": 9000, "total_steps": 40000, "loss": 0.0729, "lr": 0.26406854561777, "epoch": 0.43974299464979355, "percentage": 22.5, "elapsed_time": "9:21:45", "remaining_time": "1 day, 8:14:58", "throughput": 338.62, "total_tokens": 11413440} {"current_steps": 9000, "total_steps": 40000, "eval_loss": 0.07104141265153885, "epoch": 0.43974299464979355, "percentage": 22.5, "elapsed_time": "9:32:25", "remaining_time": "1 day, 8:51:42", "throughput": 332.31, "total_tokens": 11413440} {"current_steps": 9005, "total_steps": 40000, "loss": 0.0576, "lr": 0.26403028469356576, "epoch": 0.4399872963134879, "percentage": 22.51, "elapsed_time": "9:32:29", "remaining_time": "1 day, 8:50:30", "throughput": 332.47, "total_tokens": 11420256} {"current_steps": 9010, "total_steps": 40000, "loss": 0.0857, "lr": 0.2639920061844585, "epoch": 0.4402315979771822, "percentage": 22.53, "elapsed_time": "9:32:32", "remaining_time": "1 day, 8:49:16", "throughput": 332.63, "total_tokens": 11426592} {"current_steps": 9015, "total_steps": 40000, "loss": 0.0817, "lr": 0.2639537100963515, "epoch": 0.4404758996408766, "percentage": 22.54, "elapsed_time": "9:32:36", "remaining_time": "1 day, 8:48:03", "throughput": 332.79, "total_tokens": 11433216} {"current_steps": 9020, "total_steps": 40000, "loss": 0.0793, "lr": 0.26391539643515033, "epoch": 0.4407202013045709, "percentage": 22.55, "elapsed_time": "9:32:39", "remaining_time": "1 day, 8:46:49", "throughput": 332.94, "total_tokens": 11439360} {"current_steps": 9025, "total_steps": 40000, "loss": 0.0962, "lr": 0.26387706520676346, "epoch": 0.4409645029682652, "percentage": 22.56, "elapsed_time": "9:32:42", "remaining_time": "1 day, 8:45:35", "throughput": 333.1, "total_tokens": 11445888} {"current_steps": 9030, "total_steps": 40000, "loss": 0.0934, "lr": 0.26383871641710205, "epoch": 0.44120880463195955, "percentage": 22.57, "elapsed_time": "9:32:45", "remaining_time": "1 day, 8:44:21", "throughput": 333.24, "total_tokens": 11451968} {"current_steps": 9035, "total_steps": 40000, "loss": 0.0708, "lr": 0.26380035007208, "epoch": 0.4414531062956539, "percentage": 22.59, "elapsed_time": "9:32:48", "remaining_time": "1 day, 8:43:07", "throughput": 333.39, "total_tokens": 11457952} {"current_steps": 9040, "total_steps": 40000, "loss": 0.0891, "lr": 0.26376196617761394, "epoch": 0.4416974079593482, "percentage": 22.6, "elapsed_time": "9:32:51", "remaining_time": "1 day, 8:41:53", "throughput": 333.54, "total_tokens": 11464128} {"current_steps": 9045, "total_steps": 40000, "loss": 0.0886, "lr": 0.263723564739623, "epoch": 0.4419417096230425, "percentage": 22.61, "elapsed_time": "9:32:54", "remaining_time": "1 day, 8:40:40", "throughput": 333.69, "total_tokens": 11470528} {"current_steps": 9050, "total_steps": 40000, "loss": 0.0955, "lr": 0.2636851457640293, "epoch": 0.44218601128673685, "percentage": 22.62, "elapsed_time": "9:32:57", "remaining_time": "1 day, 8:39:27", "throughput": 333.85, "total_tokens": 11477056} {"current_steps": 9055, "total_steps": 40000, "loss": 0.0789, "lr": 0.26364670925675737, "epoch": 0.44243031295043117, "percentage": 22.64, "elapsed_time": "9:33:00", "remaining_time": "1 day, 8:38:14", "throughput": 334.01, "total_tokens": 11483424} {"current_steps": 9060, "total_steps": 40000, "loss": 0.0558, "lr": 0.2636082552237347, "epoch": 0.4426746146141255, "percentage": 22.65, "elapsed_time": "9:33:03", "remaining_time": "1 day, 8:37:00", "throughput": 334.16, "total_tokens": 11489504} {"current_steps": 9065, "total_steps": 40000, "loss": 0.0581, "lr": 0.26356978367089146, "epoch": 0.4429189162778199, "percentage": 22.66, "elapsed_time": "9:33:06", "remaining_time": "1 day, 8:35:47", "throughput": 334.32, "total_tokens": 11496064} {"current_steps": 9070, "total_steps": 40000, "loss": 0.0732, "lr": 0.26353129460416036, "epoch": 0.4431632179415142, "percentage": 22.68, "elapsed_time": "9:33:09", "remaining_time": "1 day, 8:34:34", "throughput": 334.48, "total_tokens": 11502624} {"current_steps": 9075, "total_steps": 40000, "loss": 0.0488, "lr": 0.2634927880294769, "epoch": 0.4434075196052085, "percentage": 22.69, "elapsed_time": "9:33:12", "remaining_time": "1 day, 8:33:21", "throughput": 334.63, "total_tokens": 11508800} {"current_steps": 9080, "total_steps": 40000, "loss": 0.086, "lr": 0.26345426395277927, "epoch": 0.44365182126890285, "percentage": 22.7, "elapsed_time": "9:33:16", "remaining_time": "1 day, 8:32:08", "throughput": 334.78, "total_tokens": 11514976} {"current_steps": 9085, "total_steps": 40000, "loss": 0.0871, "lr": 0.2634157223800084, "epoch": 0.44389612293259717, "percentage": 22.71, "elapsed_time": "9:33:19", "remaining_time": "1 day, 8:30:55", "throughput": 334.92, "total_tokens": 11520992} {"current_steps": 9090, "total_steps": 40000, "loss": 0.089, "lr": 0.26337716331710787, "epoch": 0.4441404245962915, "percentage": 22.73, "elapsed_time": "9:33:22", "remaining_time": "1 day, 8:29:42", "throughput": 335.08, "total_tokens": 11527552} {"current_steps": 9095, "total_steps": 40000, "loss": 0.0497, "lr": 0.2633385867700239, "epoch": 0.4443847262599858, "percentage": 22.74, "elapsed_time": "9:33:25", "remaining_time": "1 day, 8:28:29", "throughput": 335.24, "total_tokens": 11533888} {"current_steps": 9100, "total_steps": 40000, "loss": 0.071, "lr": 0.2632999927447056, "epoch": 0.44462902792368014, "percentage": 22.75, "elapsed_time": "9:33:28", "remaining_time": "1 day, 8:27:17", "throughput": 335.39, "total_tokens": 11540224} {"current_steps": 9105, "total_steps": 40000, "loss": 0.0865, "lr": 0.2632613812471046, "epoch": 0.44487332958737447, "percentage": 22.76, "elapsed_time": "9:33:31", "remaining_time": "1 day, 8:26:04", "throughput": 335.54, "total_tokens": 11546336} {"current_steps": 9110, "total_steps": 40000, "loss": 0.0646, "lr": 0.2632227522831753, "epoch": 0.44511763125106885, "percentage": 22.78, "elapsed_time": "9:33:34", "remaining_time": "1 day, 8:24:51", "throughput": 335.68, "total_tokens": 11552256} {"current_steps": 9115, "total_steps": 40000, "loss": 0.0569, "lr": 0.26318410585887475, "epoch": 0.44536193291476317, "percentage": 22.79, "elapsed_time": "9:33:37", "remaining_time": "1 day, 8:23:39", "throughput": 335.85, "total_tokens": 11559008} {"current_steps": 9120, "total_steps": 40000, "loss": 0.0544, "lr": 0.2631454419801627, "epoch": 0.4456062345784575, "percentage": 22.8, "elapsed_time": "9:33:40", "remaining_time": "1 day, 8:22:27", "throughput": 336.0, "total_tokens": 11565536} {"current_steps": 9125, "total_steps": 40000, "loss": 0.0567, "lr": 0.2631067606530016, "epoch": 0.4458505362421518, "percentage": 22.81, "elapsed_time": "9:33:43", "remaining_time": "1 day, 8:21:14", "throughput": 336.14, "total_tokens": 11571360} {"current_steps": 9130, "total_steps": 40000, "loss": 0.0919, "lr": 0.2630680618833567, "epoch": 0.44609483790584614, "percentage": 22.82, "elapsed_time": "9:33:46", "remaining_time": "1 day, 8:20:02", "throughput": 336.3, "total_tokens": 11577632} {"current_steps": 9135, "total_steps": 40000, "loss": 0.0459, "lr": 0.26302934567719566, "epoch": 0.44633913956954047, "percentage": 22.84, "elapsed_time": "9:33:49", "remaining_time": "1 day, 8:18:49", "throughput": 336.42, "total_tokens": 11582976} {"current_steps": 9140, "total_steps": 40000, "loss": 0.0881, "lr": 0.2629906120404892, "epoch": 0.4465834412332348, "percentage": 22.85, "elapsed_time": "9:33:52", "remaining_time": "1 day, 8:17:38", "throughput": 336.59, "total_tokens": 11589696} {"current_steps": 9145, "total_steps": 40000, "loss": 0.027, "lr": 0.26295186097921036, "epoch": 0.4468277428969291, "percentage": 22.86, "elapsed_time": "9:33:55", "remaining_time": "1 day, 8:16:26", "throughput": 336.75, "total_tokens": 11596224} {"current_steps": 9150, "total_steps": 40000, "loss": 0.0869, "lr": 0.2629130924993351, "epoch": 0.44707204456062344, "percentage": 22.88, "elapsed_time": "9:33:59", "remaining_time": "1 day, 8:15:14", "throughput": 336.93, "total_tokens": 11603488} {"current_steps": 9155, "total_steps": 40000, "loss": 0.047, "lr": 0.2628743066068421, "epoch": 0.44731634622431776, "percentage": 22.89, "elapsed_time": "9:34:02", "remaining_time": "1 day, 8:14:02", "throughput": 337.09, "total_tokens": 11610016} {"current_steps": 9160, "total_steps": 40000, "loss": 0.0503, "lr": 0.26283550330771244, "epoch": 0.44756064788801214, "percentage": 22.9, "elapsed_time": "9:34:05", "remaining_time": "1 day, 8:12:51", "throughput": 337.24, "total_tokens": 11616448} {"current_steps": 9165, "total_steps": 40000, "loss": 0.1209, "lr": 0.2627966826079303, "epoch": 0.44780494955170647, "percentage": 22.91, "elapsed_time": "9:34:08", "remaining_time": "1 day, 8:11:39", "throughput": 337.39, "total_tokens": 11622560} {"current_steps": 9170, "total_steps": 40000, "loss": 0.0555, "lr": 0.26275784451348216, "epoch": 0.4480492512154008, "percentage": 22.93, "elapsed_time": "9:34:11", "remaining_time": "1 day, 8:10:27", "throughput": 337.53, "total_tokens": 11628512} {"current_steps": 9175, "total_steps": 40000, "loss": 0.033, "lr": 0.2627189890303574, "epoch": 0.4482935528790951, "percentage": 22.94, "elapsed_time": "9:34:14", "remaining_time": "1 day, 8:09:15", "throughput": 337.69, "total_tokens": 11635008} {"current_steps": 9180, "total_steps": 40000, "loss": 0.0563, "lr": 0.262680116164548, "epoch": 0.44853785454278944, "percentage": 22.95, "elapsed_time": "9:34:17", "remaining_time": "1 day, 8:08:04", "throughput": 337.84, "total_tokens": 11641216} {"current_steps": 9185, "total_steps": 40000, "loss": 0.0703, "lr": 0.2626412259220487, "epoch": 0.44878215620648376, "percentage": 22.96, "elapsed_time": "9:34:20", "remaining_time": "1 day, 8:06:52", "throughput": 337.99, "total_tokens": 11647456} {"current_steps": 9190, "total_steps": 40000, "loss": 0.0444, "lr": 0.2626023183088568, "epoch": 0.4490264578701781, "percentage": 22.98, "elapsed_time": "9:34:23", "remaining_time": "1 day, 8:05:41", "throughput": 338.14, "total_tokens": 11653696} {"current_steps": 9195, "total_steps": 40000, "loss": 0.0744, "lr": 0.26256339333097234, "epoch": 0.4492707595338724, "percentage": 22.99, "elapsed_time": "9:34:26", "remaining_time": "1 day, 8:04:30", "throughput": 338.3, "total_tokens": 11659936} {"current_steps": 9200, "total_steps": 40000, "loss": 0.0865, "lr": 0.2625244509943981, "epoch": 0.44951506119756673, "percentage": 23.0, "elapsed_time": "9:34:29", "remaining_time": "1 day, 8:03:19", "throughput": 338.46, "total_tokens": 11666624} {"current_steps": 9200, "total_steps": 40000, "eval_loss": 0.07761950045824051, "epoch": 0.44951506119756673, "percentage": 23.0, "elapsed_time": "9:45:08", "remaining_time": "1 day, 8:38:58", "throughput": 332.3, "total_tokens": 11666624} {"current_steps": 9205, "total_steps": 40000, "loss": 0.0512, "lr": 0.2624854913051395, "epoch": 0.44975936286126106, "percentage": 23.01, "elapsed_time": "9:45:12", "remaining_time": "1 day, 8:37:49", "throughput": 332.44, "total_tokens": 11672992} {"current_steps": 9210, "total_steps": 40000, "loss": 0.0596, "lr": 0.26244651426920446, "epoch": 0.45000366452495544, "percentage": 23.03, "elapsed_time": "9:45:16", "remaining_time": "1 day, 8:36:36", "throughput": 332.59, "total_tokens": 11679392} {"current_steps": 9215, "total_steps": 40000, "loss": 0.0733, "lr": 0.26240751989260386, "epoch": 0.45024796618864976, "percentage": 23.04, "elapsed_time": "9:45:19", "remaining_time": "1 day, 8:35:24", "throughput": 332.75, "total_tokens": 11685952} {"current_steps": 9220, "total_steps": 40000, "loss": 0.0658, "lr": 0.2623685081813511, "epoch": 0.4504922678523441, "percentage": 23.05, "elapsed_time": "9:45:22", "remaining_time": "1 day, 8:34:11", "throughput": 332.89, "total_tokens": 11691744} {"current_steps": 9225, "total_steps": 40000, "loss": 0.0448, "lr": 0.2623294791414623, "epoch": 0.4507365695160384, "percentage": 23.06, "elapsed_time": "9:45:25", "remaining_time": "1 day, 8:32:59", "throughput": 333.03, "total_tokens": 11697824} {"current_steps": 9230, "total_steps": 40000, "loss": 0.0609, "lr": 0.26229043277895614, "epoch": 0.45098087117973273, "percentage": 23.08, "elapsed_time": "9:45:28", "remaining_time": "1 day, 8:31:47", "throughput": 333.18, "total_tokens": 11704096} {"current_steps": 9235, "total_steps": 40000, "loss": 0.0518, "lr": 0.2622513690998542, "epoch": 0.45122517284342706, "percentage": 23.09, "elapsed_time": "9:45:31", "remaining_time": "1 day, 8:30:34", "throughput": 333.33, "total_tokens": 11710400} {"current_steps": 9240, "total_steps": 40000, "loss": 0.0828, "lr": 0.26221228811018044, "epoch": 0.4514694745071214, "percentage": 23.1, "elapsed_time": "9:45:34", "remaining_time": "1 day, 8:29:22", "throughput": 333.49, "total_tokens": 11716832} {"current_steps": 9245, "total_steps": 40000, "loss": 0.0504, "lr": 0.2621731898159617, "epoch": 0.4517137761708157, "percentage": 23.11, "elapsed_time": "9:45:37", "remaining_time": "1 day, 8:28:10", "throughput": 333.64, "total_tokens": 11723232} {"current_steps": 9250, "total_steps": 40000, "loss": 0.1072, "lr": 0.26213407422322743, "epoch": 0.45195807783451003, "percentage": 23.12, "elapsed_time": "9:45:40", "remaining_time": "1 day, 8:26:58", "throughput": 333.79, "total_tokens": 11729472} {"current_steps": 9255, "total_steps": 40000, "loss": 0.0995, "lr": 0.2620949413380098, "epoch": 0.4522023794982044, "percentage": 23.14, "elapsed_time": "9:45:43", "remaining_time": "1 day, 8:25:46", "throughput": 333.93, "total_tokens": 11735584} {"current_steps": 9260, "total_steps": 40000, "loss": 0.0873, "lr": 0.26205579116634353, "epoch": 0.45244668116189873, "percentage": 23.15, "elapsed_time": "9:45:46", "remaining_time": "1 day, 8:24:34", "throughput": 334.07, "total_tokens": 11741600} {"current_steps": 9265, "total_steps": 40000, "loss": 0.0818, "lr": 0.26201662371426604, "epoch": 0.45269098282559306, "percentage": 23.16, "elapsed_time": "9:45:49", "remaining_time": "1 day, 8:23:23", "throughput": 334.22, "total_tokens": 11747680} {"current_steps": 9270, "total_steps": 40000, "loss": 0.0932, "lr": 0.2619774389878175, "epoch": 0.4529352844892874, "percentage": 23.18, "elapsed_time": "9:45:52", "remaining_time": "1 day, 8:22:11", "throughput": 334.38, "total_tokens": 11754240} {"current_steps": 9275, "total_steps": 40000, "loss": 0.0669, "lr": 0.2619382369930407, "epoch": 0.4531795861529817, "percentage": 23.19, "elapsed_time": "9:45:56", "remaining_time": "1 day, 8:21:00", "throughput": 334.53, "total_tokens": 11760736} {"current_steps": 9280, "total_steps": 40000, "loss": 0.0592, "lr": 0.261899017735981, "epoch": 0.45342388781667603, "percentage": 23.2, "elapsed_time": "9:45:59", "remaining_time": "1 day, 8:19:48", "throughput": 334.68, "total_tokens": 11767200} {"current_steps": 9285, "total_steps": 40000, "loss": 0.0606, "lr": 0.2618597812226866, "epoch": 0.45366818948037035, "percentage": 23.21, "elapsed_time": "9:46:02", "remaining_time": "1 day, 8:18:37", "throughput": 334.83, "total_tokens": 11773472} {"current_steps": 9290, "total_steps": 40000, "loss": 0.0824, "lr": 0.2618205274592082, "epoch": 0.4539124911440647, "percentage": 23.23, "elapsed_time": "9:46:05", "remaining_time": "1 day, 8:17:26", "throughput": 334.99, "total_tokens": 11779904} {"current_steps": 9295, "total_steps": 40000, "loss": 0.0769, "lr": 0.2617812564515992, "epoch": 0.454156792807759, "percentage": 23.24, "elapsed_time": "9:46:08", "remaining_time": "1 day, 8:16:14", "throughput": 335.13, "total_tokens": 11785888} {"current_steps": 9300, "total_steps": 40000, "loss": 0.0494, "lr": 0.2617419682059158, "epoch": 0.4544010944714533, "percentage": 23.25, "elapsed_time": "9:46:11", "remaining_time": "1 day, 8:15:03", "throughput": 335.27, "total_tokens": 11791904} {"current_steps": 9305, "total_steps": 40000, "loss": 0.0577, "lr": 0.26170266272821663, "epoch": 0.4546453961351477, "percentage": 23.26, "elapsed_time": "9:46:14", "remaining_time": "1 day, 8:13:52", "throughput": 335.41, "total_tokens": 11798016} {"current_steps": 9310, "total_steps": 40000, "loss": 0.0701, "lr": 0.26166334002456315, "epoch": 0.45488969779884203, "percentage": 23.28, "elapsed_time": "9:46:17", "remaining_time": "1 day, 8:12:41", "throughput": 335.56, "total_tokens": 11804096} {"current_steps": 9315, "total_steps": 40000, "loss": 0.0895, "lr": 0.2616240001010194, "epoch": 0.45513399946253635, "percentage": 23.29, "elapsed_time": "9:46:20", "remaining_time": "1 day, 8:11:29", "throughput": 335.7, "total_tokens": 11809984} {"current_steps": 9320, "total_steps": 40000, "loss": 0.0552, "lr": 0.26158464296365197, "epoch": 0.4553783011262307, "percentage": 23.3, "elapsed_time": "9:46:23", "remaining_time": "1 day, 8:10:18", "throughput": 335.84, "total_tokens": 11816032} {"current_steps": 9325, "total_steps": 40000, "loss": 0.0764, "lr": 0.2615452686185304, "epoch": 0.455622602789925, "percentage": 23.31, "elapsed_time": "9:46:26", "remaining_time": "1 day, 8:09:07", "throughput": 335.99, "total_tokens": 11822272} {"current_steps": 9330, "total_steps": 40000, "loss": 0.0688, "lr": 0.26150587707172673, "epoch": 0.4558669044536193, "percentage": 23.33, "elapsed_time": "9:46:29", "remaining_time": "1 day, 8:07:56", "throughput": 336.14, "total_tokens": 11828640} {"current_steps": 9335, "total_steps": 40000, "loss": 0.1022, "lr": 0.2614664683293154, "epoch": 0.45611120611731365, "percentage": 23.34, "elapsed_time": "9:46:32", "remaining_time": "1 day, 8:06:46", "throughput": 336.29, "total_tokens": 11834848} {"current_steps": 9340, "total_steps": 40000, "loss": 0.1004, "lr": 0.26142704239737397, "epoch": 0.456355507781008, "percentage": 23.35, "elapsed_time": "9:46:35", "remaining_time": "1 day, 8:05:35", "throughput": 336.43, "total_tokens": 11840800} {"current_steps": 9345, "total_steps": 40000, "loss": 0.067, "lr": 0.26138759928198235, "epoch": 0.4565998094447023, "percentage": 23.36, "elapsed_time": "9:46:38", "remaining_time": "1 day, 8:04:24", "throughput": 336.57, "total_tokens": 11846752} {"current_steps": 9350, "total_steps": 40000, "loss": 0.052, "lr": 0.26134813898922304, "epoch": 0.4568441111083966, "percentage": 23.38, "elapsed_time": "9:46:41", "remaining_time": "1 day, 8:03:13", "throughput": 336.71, "total_tokens": 11852800} {"current_steps": 9355, "total_steps": 40000, "loss": 0.0545, "lr": 0.26130866152518145, "epoch": 0.457088412772091, "percentage": 23.39, "elapsed_time": "9:46:44", "remaining_time": "1 day, 8:02:03", "throughput": 336.86, "total_tokens": 11859232} {"current_steps": 9360, "total_steps": 40000, "loss": 0.0612, "lr": 0.2612691668959455, "epoch": 0.4573327144357853, "percentage": 23.4, "elapsed_time": "9:46:48", "remaining_time": "1 day, 8:00:53", "throughput": 337.03, "total_tokens": 11866304} {"current_steps": 9365, "total_steps": 40000, "loss": 0.1021, "lr": 0.2612296551076057, "epoch": 0.45757701609947965, "percentage": 23.41, "elapsed_time": "9:46:51", "remaining_time": "1 day, 7:59:43", "throughput": 337.18, "total_tokens": 11872640} {"current_steps": 9370, "total_steps": 40000, "loss": 0.0722, "lr": 0.26119012616625525, "epoch": 0.457821317763174, "percentage": 23.43, "elapsed_time": "9:46:54", "remaining_time": "1 day, 7:58:33", "throughput": 337.33, "total_tokens": 11878912} {"current_steps": 9375, "total_steps": 40000, "loss": 0.0394, "lr": 0.26115058007799, "epoch": 0.4580656194268683, "percentage": 23.44, "elapsed_time": "9:46:57", "remaining_time": "1 day, 7:57:23", "throughput": 337.48, "total_tokens": 11885056} {"current_steps": 9380, "total_steps": 40000, "loss": 0.0701, "lr": 0.26111101684890864, "epoch": 0.4583099210905626, "percentage": 23.45, "elapsed_time": "9:47:00", "remaining_time": "1 day, 7:56:13", "throughput": 337.64, "total_tokens": 11891648} {"current_steps": 9385, "total_steps": 40000, "loss": 0.0649, "lr": 0.26107143648511205, "epoch": 0.45855422275425695, "percentage": 23.46, "elapsed_time": "9:47:03", "remaining_time": "1 day, 7:55:02", "throughput": 337.77, "total_tokens": 11897568} {"current_steps": 9390, "total_steps": 40000, "loss": 0.0457, "lr": 0.2610318389927042, "epoch": 0.45879852441795127, "percentage": 23.47, "elapsed_time": "9:47:06", "remaining_time": "1 day, 7:53:53", "throughput": 337.93, "total_tokens": 11904192} {"current_steps": 9395, "total_steps": 40000, "loss": 0.0504, "lr": 0.26099222437779146, "epoch": 0.4590428260816456, "percentage": 23.49, "elapsed_time": "9:47:09", "remaining_time": "1 day, 7:52:43", "throughput": 338.09, "total_tokens": 11910912} {"current_steps": 9400, "total_steps": 40000, "loss": 0.0588, "lr": 0.26095259264648285, "epoch": 0.4592871277453399, "percentage": 23.5, "elapsed_time": "9:47:12", "remaining_time": "1 day, 7:51:33", "throughput": 338.24, "total_tokens": 11917248} {"current_steps": 9400, "total_steps": 40000, "eval_loss": 0.07078426331281662, "epoch": 0.4592871277453399, "percentage": 23.5, "elapsed_time": "9:57:51", "remaining_time": "1 day, 8:26:13", "throughput": 332.22, "total_tokens": 11917248} {"current_steps": 9405, "total_steps": 40000, "loss": 0.0731, "lr": 0.2609129438048902, "epoch": 0.4595314294090343, "percentage": 23.51, "elapsed_time": "9:57:55", "remaining_time": "1 day, 8:25:04", "throughput": 332.36, "total_tokens": 11923328} {"current_steps": 9410, "total_steps": 40000, "loss": 0.0881, "lr": 0.2608732778591278, "epoch": 0.4597757310727286, "percentage": 23.52, "elapsed_time": "9:57:58", "remaining_time": "1 day, 8:23:52", "throughput": 332.5, "total_tokens": 11929376} {"current_steps": 9415, "total_steps": 40000, "loss": 0.063, "lr": 0.2608335948153126, "epoch": 0.46002003273642295, "percentage": 23.54, "elapsed_time": "9:58:01", "remaining_time": "1 day, 8:22:41", "throughput": 332.64, "total_tokens": 11935648} {"current_steps": 9420, "total_steps": 40000, "loss": 0.0593, "lr": 0.26079389467956426, "epoch": 0.46026433440011727, "percentage": 23.55, "elapsed_time": "9:58:04", "remaining_time": "1 day, 8:21:30", "throughput": 332.78, "total_tokens": 11941664} {"current_steps": 9425, "total_steps": 40000, "loss": 0.0539, "lr": 0.26075417745800505, "epoch": 0.4605086360638116, "percentage": 23.56, "elapsed_time": "9:58:07", "remaining_time": "1 day, 8:20:20", "throughput": 332.93, "total_tokens": 11948000} {"current_steps": 9430, "total_steps": 40000, "loss": 0.0478, "lr": 0.26071444315675985, "epoch": 0.4607529377275059, "percentage": 23.57, "elapsed_time": "9:58:10", "remaining_time": "1 day, 8:19:09", "throughput": 333.07, "total_tokens": 11954176} {"current_steps": 9435, "total_steps": 40000, "loss": 0.0574, "lr": 0.2606746917819562, "epoch": 0.46099723939120024, "percentage": 23.59, "elapsed_time": "9:58:13", "remaining_time": "1 day, 8:17:58", "throughput": 333.23, "total_tokens": 11960704} {"current_steps": 9440, "total_steps": 40000, "loss": 0.0854, "lr": 0.2606349233397242, "epoch": 0.46124154105489457, "percentage": 23.6, "elapsed_time": "9:58:16", "remaining_time": "1 day, 8:16:48", "throughput": 333.37, "total_tokens": 11966816} {"current_steps": 9445, "total_steps": 40000, "loss": 0.0985, "lr": 0.26059513783619676, "epoch": 0.4614858427185889, "percentage": 23.61, "elapsed_time": "9:58:19", "remaining_time": "1 day, 8:15:37", "throughput": 333.51, "total_tokens": 11972992} {"current_steps": 9450, "total_steps": 40000, "loss": 0.0607, "lr": 0.26055533527750924, "epoch": 0.46173014438228327, "percentage": 23.62, "elapsed_time": "9:58:22", "remaining_time": "1 day, 8:14:26", "throughput": 333.66, "total_tokens": 11979296} {"current_steps": 9455, "total_steps": 40000, "loss": 0.0756, "lr": 0.26051551566979964, "epoch": 0.4619744460459776, "percentage": 23.64, "elapsed_time": "9:58:25", "remaining_time": "1 day, 8:13:16", "throughput": 333.8, "total_tokens": 11985536} {"current_steps": 9460, "total_steps": 40000, "loss": 0.0635, "lr": 0.26047567901920876, "epoch": 0.4622187477096719, "percentage": 23.65, "elapsed_time": "9:58:29", "remaining_time": "1 day, 8:12:06", "throughput": 333.95, "total_tokens": 11991776} {"current_steps": 9465, "total_steps": 40000, "loss": 0.0832, "lr": 0.2604358253318798, "epoch": 0.46246304937336624, "percentage": 23.66, "elapsed_time": "9:58:32", "remaining_time": "1 day, 8:10:55", "throughput": 334.09, "total_tokens": 11998016} {"current_steps": 9470, "total_steps": 40000, "loss": 0.0788, "lr": 0.26039595461395876, "epoch": 0.46270735103706057, "percentage": 23.67, "elapsed_time": "9:58:35", "remaining_time": "1 day, 8:09:45", "throughput": 334.24, "total_tokens": 12004288} {"current_steps": 9475, "total_steps": 40000, "loss": 0.0494, "lr": 0.26035606687159424, "epoch": 0.4629516527007549, "percentage": 23.69, "elapsed_time": "9:58:38", "remaining_time": "1 day, 8:08:36", "throughput": 334.4, "total_tokens": 12011232} {"current_steps": 9480, "total_steps": 40000, "loss": 0.0692, "lr": 0.26031616211093733, "epoch": 0.4631959543644492, "percentage": 23.7, "elapsed_time": "9:58:41", "remaining_time": "1 day, 8:07:26", "throughput": 334.55, "total_tokens": 12017664} {"current_steps": 9485, "total_steps": 40000, "loss": 0.0627, "lr": 0.26027624033814195, "epoch": 0.46344025602814354, "percentage": 23.71, "elapsed_time": "9:58:44", "remaining_time": "1 day, 8:06:15", "throughput": 334.69, "total_tokens": 12023616} {"current_steps": 9490, "total_steps": 40000, "loss": 0.0581, "lr": 0.2602363015593645, "epoch": 0.46368455769183786, "percentage": 23.72, "elapsed_time": "9:58:47", "remaining_time": "1 day, 8:05:05", "throughput": 334.83, "total_tokens": 12029760} {"current_steps": 9495, "total_steps": 40000, "loss": 0.1386, "lr": 0.26019634578076395, "epoch": 0.4639288593555322, "percentage": 23.74, "elapsed_time": "9:58:50", "remaining_time": "1 day, 8:03:56", "throughput": 334.99, "total_tokens": 12036512} {"current_steps": 9500, "total_steps": 40000, "loss": 0.0575, "lr": 0.26015637300850214, "epoch": 0.46417316101922657, "percentage": 23.75, "elapsed_time": "9:58:54", "remaining_time": "1 day, 8:02:47", "throughput": 335.15, "total_tokens": 12043456} {"current_steps": 9505, "total_steps": 40000, "loss": 0.0394, "lr": 0.26011638324874325, "epoch": 0.4644174626829209, "percentage": 23.76, "elapsed_time": "9:58:57", "remaining_time": "1 day, 8:01:37", "throughput": 335.31, "total_tokens": 12050176} {"current_steps": 9510, "total_steps": 40000, "loss": 0.0772, "lr": 0.2600763765076543, "epoch": 0.4646617643466152, "percentage": 23.77, "elapsed_time": "9:59:00", "remaining_time": "1 day, 8:00:27", "throughput": 335.45, "total_tokens": 12056256} {"current_steps": 9515, "total_steps": 40000, "loss": 0.0806, "lr": 0.2600363527914048, "epoch": 0.46490606601030954, "percentage": 23.79, "elapsed_time": "9:59:03", "remaining_time": "1 day, 7:59:18", "throughput": 335.6, "total_tokens": 12062528} {"current_steps": 9520, "total_steps": 40000, "loss": 0.0426, "lr": 0.25999631210616686, "epoch": 0.46515036767400386, "percentage": 23.8, "elapsed_time": "9:59:06", "remaining_time": "1 day, 7:58:08", "throughput": 335.75, "total_tokens": 12068864} {"current_steps": 9525, "total_steps": 40000, "loss": 0.0973, "lr": 0.25995625445811527, "epoch": 0.4653946693376982, "percentage": 23.81, "elapsed_time": "9:59:09", "remaining_time": "1 day, 7:56:59", "throughput": 335.9, "total_tokens": 12075360} {"current_steps": 9530, "total_steps": 40000, "loss": 0.0847, "lr": 0.2599161798534275, "epoch": 0.4656389710013925, "percentage": 23.82, "elapsed_time": "9:59:12", "remaining_time": "1 day, 7:55:49", "throughput": 336.04, "total_tokens": 12081440} {"current_steps": 9535, "total_steps": 40000, "loss": 0.0931, "lr": 0.25987608829828346, "epoch": 0.46588327266508683, "percentage": 23.84, "elapsed_time": "9:59:15", "remaining_time": "1 day, 7:54:40", "throughput": 336.17, "total_tokens": 12087328} {"current_steps": 9540, "total_steps": 40000, "loss": 0.0933, "lr": 0.25983597979886586, "epoch": 0.46612757432878116, "percentage": 23.85, "elapsed_time": "9:59:18", "remaining_time": "1 day, 7:53:31", "throughput": 336.32, "total_tokens": 12093664} {"current_steps": 9545, "total_steps": 40000, "loss": 0.0605, "lr": 0.2597958543613599, "epoch": 0.4663718759924755, "percentage": 23.86, "elapsed_time": "9:59:21", "remaining_time": "1 day, 7:52:21", "throughput": 336.47, "total_tokens": 12099968} {"current_steps": 9550, "total_steps": 40000, "loss": 0.0663, "lr": 0.25975571199195335, "epoch": 0.46661617765616986, "percentage": 23.88, "elapsed_time": "9:59:24", "remaining_time": "1 day, 7:51:12", "throughput": 336.61, "total_tokens": 12106048} {"current_steps": 9555, "total_steps": 40000, "loss": 0.0508, "lr": 0.25971555269683677, "epoch": 0.4668604793198642, "percentage": 23.89, "elapsed_time": "9:59:27", "remaining_time": "1 day, 7:50:03", "throughput": 336.76, "total_tokens": 12112352} {"current_steps": 9560, "total_steps": 40000, "loss": 0.0627, "lr": 0.25967537648220324, "epoch": 0.4671047809835585, "percentage": 23.9, "elapsed_time": "9:59:30", "remaining_time": "1 day, 7:48:54", "throughput": 336.89, "total_tokens": 12118336} {"current_steps": 9565, "total_steps": 40000, "loss": 0.0645, "lr": 0.2596351833542483, "epoch": 0.46734908264725283, "percentage": 23.91, "elapsed_time": "9:59:33", "remaining_time": "1 day, 7:47:45", "throughput": 337.03, "total_tokens": 12124352} {"current_steps": 9570, "total_steps": 40000, "loss": 0.0594, "lr": 0.25959497331917036, "epoch": 0.46759338431094716, "percentage": 23.93, "elapsed_time": "9:59:36", "remaining_time": "1 day, 7:46:36", "throughput": 337.18, "total_tokens": 12130560} {"current_steps": 9575, "total_steps": 40000, "loss": 0.1097, "lr": 0.2595547463831703, "epoch": 0.4678376859746415, "percentage": 23.94, "elapsed_time": "9:59:39", "remaining_time": "1 day, 7:45:27", "throughput": 337.33, "total_tokens": 12136960} {"current_steps": 9580, "total_steps": 40000, "loss": 0.0767, "lr": 0.25951450255245156, "epoch": 0.4680819876383358, "percentage": 23.95, "elapsed_time": "9:59:43", "remaining_time": "1 day, 7:44:19", "throughput": 337.48, "total_tokens": 12143616} {"current_steps": 9585, "total_steps": 40000, "loss": 0.0878, "lr": 0.2594742418332203, "epoch": 0.46832628930203013, "percentage": 23.96, "elapsed_time": "9:59:46", "remaining_time": "1 day, 7:43:11", "throughput": 337.63, "total_tokens": 12149984} {"current_steps": 9590, "total_steps": 40000, "loss": 0.0863, "lr": 0.2594339642316852, "epoch": 0.46857059096572445, "percentage": 23.97, "elapsed_time": "9:59:49", "remaining_time": "1 day, 7:42:02", "throughput": 337.77, "total_tokens": 12156000} {"current_steps": 9595, "total_steps": 40000, "loss": 0.0726, "lr": 0.2593936697540576, "epoch": 0.46881489262941883, "percentage": 23.99, "elapsed_time": "9:59:52", "remaining_time": "1 day, 7:40:53", "throughput": 337.91, "total_tokens": 12162208} {"current_steps": 9600, "total_steps": 40000, "loss": 0.0779, "lr": 0.2593533584065514, "epoch": 0.46905919429311316, "percentage": 24.0, "elapsed_time": "9:59:55", "remaining_time": "1 day, 7:39:45", "throughput": 338.06, "total_tokens": 12168736} {"current_steps": 9600, "total_steps": 40000, "eval_loss": 0.07239838689565659, "epoch": 0.46905919429311316, "percentage": 24.0, "elapsed_time": "10:10:35", "remaining_time": "1 day, 8:13:31", "throughput": 332.16, "total_tokens": 12168736} {"current_steps": 9605, "total_steps": 40000, "loss": 0.0664, "lr": 0.2593130301953831, "epoch": 0.4693034959568075, "percentage": 24.01, "elapsed_time": "10:10:39", "remaining_time": "1 day, 8:12:24", "throughput": 332.29, "total_tokens": 12174944} {"current_steps": 9610, "total_steps": 40000, "loss": 0.0753, "lr": 0.2592726851267718, "epoch": 0.4695477976205018, "percentage": 24.02, "elapsed_time": "10:10:42", "remaining_time": "1 day, 8:11:15", "throughput": 332.44, "total_tokens": 12181504} {"current_steps": 9615, "total_steps": 40000, "loss": 0.0533, "lr": 0.2592323232069393, "epoch": 0.46979209928419613, "percentage": 24.04, "elapsed_time": "10:10:45", "remaining_time": "1 day, 8:10:05", "throughput": 332.58, "total_tokens": 12187552} {"current_steps": 9620, "total_steps": 40000, "loss": 0.0778, "lr": 0.25919194444210986, "epoch": 0.47003640094789045, "percentage": 24.05, "elapsed_time": "10:10:48", "remaining_time": "1 day, 8:08:55", "throughput": 332.73, "total_tokens": 12193888} {"current_steps": 9625, "total_steps": 40000, "loss": 0.0816, "lr": 0.2591515488385103, "epoch": 0.4702807026115848, "percentage": 24.06, "elapsed_time": "10:10:51", "remaining_time": "1 day, 8:07:46", "throughput": 332.89, "total_tokens": 12200800} {"current_steps": 9630, "total_steps": 40000, "loss": 0.0538, "lr": 0.2591111364023704, "epoch": 0.4705250042752791, "percentage": 24.07, "elapsed_time": "10:10:54", "remaining_time": "1 day, 8:06:37", "throughput": 333.03, "total_tokens": 12207264} {"current_steps": 9635, "total_steps": 40000, "loss": 0.0728, "lr": 0.259070707139922, "epoch": 0.4707693059389734, "percentage": 24.09, "elapsed_time": "10:10:57", "remaining_time": "1 day, 8:05:28", "throughput": 333.19, "total_tokens": 12213856} {"current_steps": 9640, "total_steps": 40000, "loss": 0.1055, "lr": 0.25903026105739985, "epoch": 0.47101360760266775, "percentage": 24.1, "elapsed_time": "10:11:00", "remaining_time": "1 day, 8:04:19", "throughput": 333.34, "total_tokens": 12220480} {"current_steps": 9645, "total_steps": 40000, "loss": 0.0738, "lr": 0.2589897981610413, "epoch": 0.47125790926636213, "percentage": 24.11, "elapsed_time": "10:11:03", "remaining_time": "1 day, 8:03:09", "throughput": 333.47, "total_tokens": 12226496} {"current_steps": 9650, "total_steps": 40000, "loss": 0.0757, "lr": 0.2589493184570863, "epoch": 0.47150221093005645, "percentage": 24.12, "elapsed_time": "10:11:07", "remaining_time": "1 day, 8:02:00", "throughput": 333.62, "total_tokens": 12232768} {"current_steps": 9655, "total_steps": 40000, "loss": 0.1104, "lr": 0.25890882195177717, "epoch": 0.4717465125937508, "percentage": 24.14, "elapsed_time": "10:11:10", "remaining_time": "1 day, 8:00:51", "throughput": 333.76, "total_tokens": 12239040} {"current_steps": 9660, "total_steps": 40000, "loss": 0.0697, "lr": 0.25886830865135907, "epoch": 0.4719908142574451, "percentage": 24.15, "elapsed_time": "10:11:13", "remaining_time": "1 day, 7:59:43", "throughput": 333.92, "total_tokens": 12246144} {"current_steps": 9665, "total_steps": 40000, "loss": 0.0826, "lr": 0.25882777856207967, "epoch": 0.4722351159211394, "percentage": 24.16, "elapsed_time": "10:11:16", "remaining_time": "1 day, 7:58:34", "throughput": 334.09, "total_tokens": 12253152} {"current_steps": 9670, "total_steps": 40000, "loss": 0.0924, "lr": 0.2587872316901892, "epoch": 0.47247941758483375, "percentage": 24.18, "elapsed_time": "10:11:19", "remaining_time": "1 day, 7:57:26", "throughput": 334.23, "total_tokens": 12259488} {"current_steps": 9675, "total_steps": 40000, "loss": 0.1097, "lr": 0.25874666804194046, "epoch": 0.4727237192485281, "percentage": 24.19, "elapsed_time": "10:11:22", "remaining_time": "1 day, 7:56:17", "throughput": 334.38, "total_tokens": 12265856} {"current_steps": 9680, "total_steps": 40000, "loss": 0.0746, "lr": 0.258706087623589, "epoch": 0.4729680209122224, "percentage": 24.2, "elapsed_time": "10:11:25", "remaining_time": "1 day, 7:55:08", "throughput": 334.51, "total_tokens": 12271712} {"current_steps": 9685, "total_steps": 40000, "loss": 0.0932, "lr": 0.25866549044139264, "epoch": 0.4732123225759167, "percentage": 24.21, "elapsed_time": "10:11:28", "remaining_time": "1 day, 7:53:59", "throughput": 334.65, "total_tokens": 12277856} {"current_steps": 9690, "total_steps": 40000, "loss": 0.0929, "lr": 0.25862487650161214, "epoch": 0.47345662423961105, "percentage": 24.22, "elapsed_time": "10:11:31", "remaining_time": "1 day, 7:52:51", "throughput": 334.79, "total_tokens": 12284032} {"current_steps": 9695, "total_steps": 40000, "loss": 0.0542, "lr": 0.2585842458105106, "epoch": 0.4737009259033054, "percentage": 24.24, "elapsed_time": "10:11:35", "remaining_time": "1 day, 7:51:42", "throughput": 334.94, "total_tokens": 12290624} {"current_steps": 9700, "total_steps": 40000, "loss": 0.0502, "lr": 0.2585435983743538, "epoch": 0.47394522756699975, "percentage": 24.25, "elapsed_time": "10:11:38", "remaining_time": "1 day, 7:50:34", "throughput": 335.09, "total_tokens": 12297216} {"current_steps": 9705, "total_steps": 40000, "loss": 0.0605, "lr": 0.2585029341994101, "epoch": 0.4741895292306941, "percentage": 24.26, "elapsed_time": "10:11:41", "remaining_time": "1 day, 7:49:25", "throughput": 335.22, "total_tokens": 12303104} {"current_steps": 9710, "total_steps": 40000, "loss": 0.0841, "lr": 0.2584622532919504, "epoch": 0.4744338308943884, "percentage": 24.27, "elapsed_time": "10:11:44", "remaining_time": "1 day, 7:48:17", "throughput": 335.38, "total_tokens": 12309824} {"current_steps": 9715, "total_steps": 40000, "loss": 0.08, "lr": 0.2584215556582482, "epoch": 0.4746781325580827, "percentage": 24.29, "elapsed_time": "10:11:47", "remaining_time": "1 day, 7:47:09", "throughput": 335.52, "total_tokens": 12315936} {"current_steps": 9720, "total_steps": 40000, "loss": 0.0508, "lr": 0.25838084130457967, "epoch": 0.47492243422177705, "percentage": 24.3, "elapsed_time": "10:11:50", "remaining_time": "1 day, 7:46:01", "throughput": 335.66, "total_tokens": 12322272} {"current_steps": 9725, "total_steps": 40000, "loss": 0.0833, "lr": 0.2583401102372234, "epoch": 0.47516673588547137, "percentage": 24.31, "elapsed_time": "10:11:53", "remaining_time": "1 day, 7:44:53", "throughput": 335.81, "total_tokens": 12328800} {"current_steps": 9730, "total_steps": 40000, "loss": 0.0734, "lr": 0.2582993624624606, "epoch": 0.4754110375491657, "percentage": 24.32, "elapsed_time": "10:11:56", "remaining_time": "1 day, 7:43:45", "throughput": 335.97, "total_tokens": 12335680} {"current_steps": 9735, "total_steps": 40000, "loss": 0.0701, "lr": 0.25825859798657513, "epoch": 0.47565533921286, "percentage": 24.34, "elapsed_time": "10:11:59", "remaining_time": "1 day, 7:42:38", "throughput": 336.13, "total_tokens": 12342624} {"current_steps": 9740, "total_steps": 40000, "loss": 0.0473, "lr": 0.25821781681585343, "epoch": 0.47589964087655434, "percentage": 24.35, "elapsed_time": "10:12:03", "remaining_time": "1 day, 7:41:30", "throughput": 336.28, "total_tokens": 12349120} {"current_steps": 9745, "total_steps": 40000, "loss": 0.0456, "lr": 0.2581770189565844, "epoch": 0.4761439425402487, "percentage": 24.36, "elapsed_time": "10:12:06", "remaining_time": "1 day, 7:40:22", "throughput": 336.42, "total_tokens": 12355456} {"current_steps": 9750, "total_steps": 40000, "loss": 0.0619, "lr": 0.25813620441505963, "epoch": 0.47638824420394305, "percentage": 24.38, "elapsed_time": "10:12:09", "remaining_time": "1 day, 7:39:14", "throughput": 336.56, "total_tokens": 12361600} {"current_steps": 9755, "total_steps": 40000, "loss": 0.0792, "lr": 0.2580953731975732, "epoch": 0.47663254586763737, "percentage": 24.39, "elapsed_time": "10:12:12", "remaining_time": "1 day, 7:38:06", "throughput": 336.7, "total_tokens": 12367712} {"current_steps": 9760, "total_steps": 40000, "loss": 0.0733, "lr": 0.2580545253104218, "epoch": 0.4768768475313317, "percentage": 24.4, "elapsed_time": "10:12:15", "remaining_time": "1 day, 7:36:58", "throughput": 336.84, "total_tokens": 12373952} {"current_steps": 9765, "total_steps": 40000, "loss": 0.0794, "lr": 0.2580136607599047, "epoch": 0.477121149195026, "percentage": 24.41, "elapsed_time": "10:12:18", "remaining_time": "1 day, 7:35:51", "throughput": 336.98, "total_tokens": 12380032} {"current_steps": 9770, "total_steps": 40000, "loss": 0.0552, "lr": 0.2579727795523238, "epoch": 0.47736545085872034, "percentage": 24.43, "elapsed_time": "10:12:21", "remaining_time": "1 day, 7:34:43", "throughput": 337.12, "total_tokens": 12386240} {"current_steps": 9775, "total_steps": 40000, "loss": 0.0648, "lr": 0.25793188169398334, "epoch": 0.47760975252241467, "percentage": 24.44, "elapsed_time": "10:12:24", "remaining_time": "1 day, 7:33:36", "throughput": 337.27, "total_tokens": 12392704} {"current_steps": 9780, "total_steps": 40000, "loss": 0.0497, "lr": 0.25789096719119037, "epoch": 0.477854054186109, "percentage": 24.45, "elapsed_time": "10:12:27", "remaining_time": "1 day, 7:32:28", "throughput": 337.4, "total_tokens": 12398592} {"current_steps": 9785, "total_steps": 40000, "loss": 0.061, "lr": 0.2578500360502544, "epoch": 0.4780983558498033, "percentage": 24.46, "elapsed_time": "10:12:30", "remaining_time": "1 day, 7:31:21", "throughput": 337.54, "total_tokens": 12404800} {"current_steps": 9790, "total_steps": 40000, "loss": 0.0586, "lr": 0.2578090882774876, "epoch": 0.4783426575134977, "percentage": 24.47, "elapsed_time": "10:12:33", "remaining_time": "1 day, 7:30:13", "throughput": 337.68, "total_tokens": 12411008} {"current_steps": 9795, "total_steps": 40000, "loss": 0.0723, "lr": 0.25776812387920456, "epoch": 0.478586959177192, "percentage": 24.49, "elapsed_time": "10:12:36", "remaining_time": "1 day, 7:29:06", "throughput": 337.82, "total_tokens": 12417248} {"current_steps": 9800, "total_steps": 40000, "loss": 0.0752, "lr": 0.2577271428617225, "epoch": 0.47883126084088634, "percentage": 24.5, "elapsed_time": "10:12:39", "remaining_time": "1 day, 7:27:59", "throughput": 337.97, "total_tokens": 12423520} {"current_steps": 9800, "total_steps": 40000, "eval_loss": 0.07212045788764954, "epoch": 0.47883126084088634, "percentage": 24.5, "elapsed_time": "10:23:19", "remaining_time": "1 day, 8:00:52", "throughput": 332.18, "total_tokens": 12423520} {"current_steps": 9805, "total_steps": 40000, "loss": 0.0862, "lr": 0.25768614523136124, "epoch": 0.47907556250458067, "percentage": 24.51, "elapsed_time": "10:23:23", "remaining_time": "1 day, 7:59:46", "throughput": 332.3, "total_tokens": 12429280} {"current_steps": 9810, "total_steps": 40000, "loss": 0.0658, "lr": 0.25764513099444314, "epoch": 0.479319864168275, "percentage": 24.52, "elapsed_time": "10:23:26", "remaining_time": "1 day, 7:58:38", "throughput": 332.43, "total_tokens": 12435200} {"current_steps": 9815, "total_steps": 40000, "loss": 0.0591, "lr": 0.25760410015729307, "epoch": 0.4795641658319693, "percentage": 24.54, "elapsed_time": "10:23:29", "remaining_time": "1 day, 7:57:29", "throughput": 332.57, "total_tokens": 12441440} {"current_steps": 9820, "total_steps": 40000, "loss": 0.0892, "lr": 0.2575630527262385, "epoch": 0.47980846749566364, "percentage": 24.55, "elapsed_time": "10:23:32", "remaining_time": "1 day, 7:56:21", "throughput": 332.72, "total_tokens": 12448096} {"current_steps": 9825, "total_steps": 40000, "loss": 0.0706, "lr": 0.25752198870760945, "epoch": 0.48005276915935796, "percentage": 24.56, "elapsed_time": "10:23:36", "remaining_time": "1 day, 7:55:13", "throughput": 332.86, "total_tokens": 12454336} {"current_steps": 9830, "total_steps": 40000, "loss": 0.0479, "lr": 0.2574809081077386, "epoch": 0.4802970708230523, "percentage": 24.57, "elapsed_time": "10:23:39", "remaining_time": "1 day, 7:54:05", "throughput": 332.99, "total_tokens": 12460224} {"current_steps": 9835, "total_steps": 40000, "loss": 0.0606, "lr": 0.257439810932961, "epoch": 0.4805413724867466, "percentage": 24.59, "elapsed_time": "10:23:42", "remaining_time": "1 day, 7:52:57", "throughput": 333.13, "total_tokens": 12466336} {"current_steps": 9840, "total_steps": 40000, "loss": 0.0809, "lr": 0.2573986971896144, "epoch": 0.480785674150441, "percentage": 24.6, "elapsed_time": "10:23:45", "remaining_time": "1 day, 7:51:49", "throughput": 333.27, "total_tokens": 12472704} {"current_steps": 9845, "total_steps": 40000, "loss": 0.0735, "lr": 0.257357566884039, "epoch": 0.4810299758141353, "percentage": 24.61, "elapsed_time": "10:23:48", "remaining_time": "1 day, 7:50:41", "throughput": 333.41, "total_tokens": 12479040} {"current_steps": 9850, "total_steps": 40000, "loss": 0.0698, "lr": 0.25731642002257765, "epoch": 0.48127427747782964, "percentage": 24.62, "elapsed_time": "10:23:51", "remaining_time": "1 day, 7:49:33", "throughput": 333.55, "total_tokens": 12485376} {"current_steps": 9855, "total_steps": 40000, "loss": 0.0804, "lr": 0.25727525661157574, "epoch": 0.48151857914152396, "percentage": 24.64, "elapsed_time": "10:23:54", "remaining_time": "1 day, 7:48:26", "throughput": 333.69, "total_tokens": 12491648} {"current_steps": 9860, "total_steps": 40000, "loss": 0.0574, "lr": 0.2572340766573811, "epoch": 0.4817628808052183, "percentage": 24.65, "elapsed_time": "10:23:57", "remaining_time": "1 day, 7:47:18", "throughput": 333.84, "total_tokens": 12498304} {"current_steps": 9865, "total_steps": 40000, "loss": 0.0651, "lr": 0.25719288016634434, "epoch": 0.4820071824689126, "percentage": 24.66, "elapsed_time": "10:24:00", "remaining_time": "1 day, 7:46:11", "throughput": 333.98, "total_tokens": 12504416} {"current_steps": 9870, "total_steps": 40000, "loss": 0.0786, "lr": 0.25715166714481835, "epoch": 0.48225148413260693, "percentage": 24.68, "elapsed_time": "10:24:03", "remaining_time": "1 day, 7:45:03", "throughput": 334.13, "total_tokens": 12511264} {"current_steps": 9875, "total_steps": 40000, "loss": 0.0497, "lr": 0.2571104375991587, "epoch": 0.48249578579630126, "percentage": 24.69, "elapsed_time": "10:24:06", "remaining_time": "1 day, 7:43:56", "throughput": 334.28, "total_tokens": 12517664} {"current_steps": 9880, "total_steps": 40000, "loss": 0.0856, "lr": 0.2570691915357236, "epoch": 0.4827400874599956, "percentage": 24.7, "elapsed_time": "10:24:09", "remaining_time": "1 day, 7:42:49", "throughput": 334.42, "total_tokens": 12523808} {"current_steps": 9885, "total_steps": 40000, "loss": 0.0574, "lr": 0.2570279289608736, "epoch": 0.4829843891236899, "percentage": 24.71, "elapsed_time": "10:24:12", "remaining_time": "1 day, 7:41:41", "throughput": 334.54, "total_tokens": 12529664} {"current_steps": 9890, "total_steps": 40000, "loss": 0.0598, "lr": 0.256986649880972, "epoch": 0.4832286907873843, "percentage": 24.73, "elapsed_time": "10:24:16", "remaining_time": "1 day, 7:40:34", "throughput": 334.7, "total_tokens": 12536416} {"current_steps": 9895, "total_steps": 40000, "loss": 0.0728, "lr": 0.25694535430238447, "epoch": 0.4834729924510786, "percentage": 24.74, "elapsed_time": "10:24:19", "remaining_time": "1 day, 7:39:27", "throughput": 334.83, "total_tokens": 12542496} {"current_steps": 9900, "total_steps": 40000, "loss": 0.0862, "lr": 0.25690404223147933, "epoch": 0.48371729411477293, "percentage": 24.75, "elapsed_time": "10:24:22", "remaining_time": "1 day, 7:38:19", "throughput": 334.96, "total_tokens": 12548416} {"current_steps": 9905, "total_steps": 40000, "loss": 0.076, "lr": 0.2568627136746275, "epoch": 0.48396159577846726, "percentage": 24.76, "elapsed_time": "10:24:25", "remaining_time": "1 day, 7:37:12", "throughput": 335.1, "total_tokens": 12554496} {"current_steps": 9910, "total_steps": 40000, "loss": 0.0622, "lr": 0.25682136863820226, "epoch": 0.4842058974421616, "percentage": 24.77, "elapsed_time": "10:24:28", "remaining_time": "1 day, 7:36:05", "throughput": 335.23, "total_tokens": 12560544} {"current_steps": 9915, "total_steps": 40000, "loss": 0.057, "lr": 0.25678000712857957, "epoch": 0.4844501991058559, "percentage": 24.79, "elapsed_time": "10:24:31", "remaining_time": "1 day, 7:34:58", "throughput": 335.37, "total_tokens": 12566848} {"current_steps": 9920, "total_steps": 40000, "loss": 0.095, "lr": 0.2567386291521379, "epoch": 0.48469450076955023, "percentage": 24.8, "elapsed_time": "10:24:34", "remaining_time": "1 day, 7:33:51", "throughput": 335.5, "total_tokens": 12572640} {"current_steps": 9925, "total_steps": 40000, "loss": 0.0604, "lr": 0.2566972347152583, "epoch": 0.48493880243324455, "percentage": 24.81, "elapsed_time": "10:24:37", "remaining_time": "1 day, 7:32:44", "throughput": 335.65, "total_tokens": 12579296} {"current_steps": 9930, "total_steps": 40000, "loss": 0.0832, "lr": 0.2566558238243242, "epoch": 0.4851831040969389, "percentage": 24.82, "elapsed_time": "10:24:40", "remaining_time": "1 day, 7:31:38", "throughput": 335.78, "total_tokens": 12585344} {"current_steps": 9935, "total_steps": 40000, "loss": 0.0576, "lr": 0.25661439648572176, "epoch": 0.48542740576063326, "percentage": 24.84, "elapsed_time": "10:24:43", "remaining_time": "1 day, 7:30:31", "throughput": 335.92, "total_tokens": 12591584} {"current_steps": 9940, "total_steps": 40000, "loss": 0.0658, "lr": 0.25657295270583963, "epoch": 0.4856717074243276, "percentage": 24.85, "elapsed_time": "10:24:46", "remaining_time": "1 day, 7:29:24", "throughput": 336.06, "total_tokens": 12597728} {"current_steps": 9945, "total_steps": 40000, "loss": 0.1149, "lr": 0.25653149249106894, "epoch": 0.4859160090880219, "percentage": 24.86, "elapsed_time": "10:24:49", "remaining_time": "1 day, 7:28:18", "throughput": 336.19, "total_tokens": 12603744} {"current_steps": 9950, "total_steps": 40000, "loss": 0.0529, "lr": 0.25649001584780323, "epoch": 0.48616031075171623, "percentage": 24.88, "elapsed_time": "10:24:52", "remaining_time": "1 day, 7:27:11", "throughput": 336.33, "total_tokens": 12610080} {"current_steps": 9955, "total_steps": 40000, "loss": 0.0949, "lr": 0.2564485227824389, "epoch": 0.48640461241541055, "percentage": 24.89, "elapsed_time": "10:24:55", "remaining_time": "1 day, 7:26:04", "throughput": 336.46, "total_tokens": 12615872} {"current_steps": 9960, "total_steps": 40000, "loss": 0.1079, "lr": 0.25640701330137466, "epoch": 0.4866489140791049, "percentage": 24.9, "elapsed_time": "10:24:58", "remaining_time": "1 day, 7:24:58", "throughput": 336.6, "total_tokens": 12622048} {"current_steps": 9965, "total_steps": 40000, "loss": 0.0633, "lr": 0.2563654874110117, "epoch": 0.4868932157427992, "percentage": 24.91, "elapsed_time": "10:25:01", "remaining_time": "1 day, 7:23:52", "throughput": 336.75, "total_tokens": 12628672} {"current_steps": 9970, "total_steps": 40000, "loss": 0.0609, "lr": 0.256323945117754, "epoch": 0.4871375174064935, "percentage": 24.93, "elapsed_time": "10:25:04", "remaining_time": "1 day, 7:22:46", "throughput": 336.89, "total_tokens": 12634944} {"current_steps": 9975, "total_steps": 40000, "loss": 0.0816, "lr": 0.2562823864280078, "epoch": 0.48738181907018785, "percentage": 24.94, "elapsed_time": "10:25:08", "remaining_time": "1 day, 7:21:40", "throughput": 337.03, "total_tokens": 12641312} {"current_steps": 9980, "total_steps": 40000, "loss": 0.0849, "lr": 0.25624081134818194, "epoch": 0.4876261207338822, "percentage": 24.95, "elapsed_time": "10:25:11", "remaining_time": "1 day, 7:20:34", "throughput": 337.17, "total_tokens": 12647808} {"current_steps": 9985, "total_steps": 40000, "loss": 0.0541, "lr": 0.2561992198846879, "epoch": 0.48787042239757655, "percentage": 24.96, "elapsed_time": "10:25:14", "remaining_time": "1 day, 7:19:28", "throughput": 337.33, "total_tokens": 12654592} {"current_steps": 9990, "total_steps": 40000, "loss": 0.0856, "lr": 0.25615761204393955, "epoch": 0.4881147240612709, "percentage": 24.98, "elapsed_time": "10:25:17", "remaining_time": "1 day, 7:18:22", "throughput": 337.47, "total_tokens": 12661216} {"current_steps": 9995, "total_steps": 40000, "loss": 0.0528, "lr": 0.2561159878323534, "epoch": 0.4883590257249652, "percentage": 24.99, "elapsed_time": "10:25:20", "remaining_time": "1 day, 7:17:16", "throughput": 337.62, "total_tokens": 12667744} {"current_steps": 10000, "total_steps": 40000, "loss": 0.0444, "lr": 0.2560743472563483, "epoch": 0.4886033273886595, "percentage": 25.0, "elapsed_time": "10:25:23", "remaining_time": "1 day, 7:16:10", "throughput": 337.76, "total_tokens": 12673888} {"current_steps": 10000, "total_steps": 40000, "eval_loss": 0.07422532886266708, "epoch": 0.4886033273886595, "percentage": 25.0, "elapsed_time": "10:36:03", "remaining_time": "1 day, 7:48:09", "throughput": 332.1, "total_tokens": 12673888} {"current_steps": 10005, "total_steps": 40000, "loss": 0.0991, "lr": 0.25603269032234593, "epoch": 0.48884762905235385, "percentage": 25.01, "elapsed_time": "10:36:07", "remaining_time": "1 day, 7:47:04", "throughput": 332.24, "total_tokens": 12680736} {"current_steps": 10010, "total_steps": 40000, "loss": 0.0947, "lr": 0.2559910170367702, "epoch": 0.4890919307160482, "percentage": 25.02, "elapsed_time": "10:36:10", "remaining_time": "1 day, 7:45:57", "throughput": 332.38, "total_tokens": 12687008} {"current_steps": 10015, "total_steps": 40000, "loss": 0.0708, "lr": 0.2559493274060477, "epoch": 0.4893362323797425, "percentage": 25.04, "elapsed_time": "10:36:13", "remaining_time": "1 day, 7:44:50", "throughput": 332.52, "total_tokens": 12693408} {"current_steps": 10020, "total_steps": 40000, "loss": 0.0876, "lr": 0.2559076214366074, "epoch": 0.4895805340434368, "percentage": 25.05, "elapsed_time": "10:36:16", "remaining_time": "1 day, 7:43:43", "throughput": 332.66, "total_tokens": 12699520} {"current_steps": 10025, "total_steps": 40000, "loss": 0.0742, "lr": 0.25586589913488106, "epoch": 0.48982483570713115, "percentage": 25.06, "elapsed_time": "10:36:19", "remaining_time": "1 day, 7:42:36", "throughput": 332.78, "total_tokens": 12705376} {"current_steps": 10030, "total_steps": 40000, "loss": 0.0767, "lr": 0.2558241605073026, "epoch": 0.49006913737082547, "percentage": 25.07, "elapsed_time": "10:36:22", "remaining_time": "1 day, 7:41:30", "throughput": 332.92, "total_tokens": 12711808} {"current_steps": 10035, "total_steps": 40000, "loss": 0.0774, "lr": 0.25578240556030873, "epoch": 0.49031343903451985, "percentage": 25.09, "elapsed_time": "10:36:25", "remaining_time": "1 day, 7:40:23", "throughput": 333.06, "total_tokens": 12718048} {"current_steps": 10040, "total_steps": 40000, "loss": 0.0573, "lr": 0.2557406343003386, "epoch": 0.4905577406982142, "percentage": 25.1, "elapsed_time": "10:36:28", "remaining_time": "1 day, 7:39:16", "throughput": 333.19, "total_tokens": 12724192} {"current_steps": 10045, "total_steps": 40000, "loss": 0.0397, "lr": 0.25569884673383375, "epoch": 0.4908020423619085, "percentage": 25.11, "elapsed_time": "10:36:31", "remaining_time": "1 day, 7:38:10", "throughput": 333.33, "total_tokens": 12730432} {"current_steps": 10050, "total_steps": 40000, "loss": 0.0904, "lr": 0.25565704286723856, "epoch": 0.4910463440256028, "percentage": 25.12, "elapsed_time": "10:36:34", "remaining_time": "1 day, 7:37:03", "throughput": 333.47, "total_tokens": 12736704} {"current_steps": 10055, "total_steps": 40000, "loss": 0.0848, "lr": 0.25561522270699955, "epoch": 0.49129064568929715, "percentage": 25.14, "elapsed_time": "10:36:37", "remaining_time": "1 day, 7:35:57", "throughput": 333.6, "total_tokens": 12742752} {"current_steps": 10060, "total_steps": 40000, "loss": 0.082, "lr": 0.25557338625956594, "epoch": 0.49153494735299147, "percentage": 25.15, "elapsed_time": "10:36:40", "remaining_time": "1 day, 7:34:50", "throughput": 333.73, "total_tokens": 12748896} {"current_steps": 10065, "total_steps": 40000, "loss": 0.112, "lr": 0.25553153353138947, "epoch": 0.4917792490166858, "percentage": 25.16, "elapsed_time": "10:36:43", "remaining_time": "1 day, 7:33:44", "throughput": 333.87, "total_tokens": 12755136} {"current_steps": 10070, "total_steps": 40000, "loss": 0.093, "lr": 0.2554896645289243, "epoch": 0.4920235506803801, "percentage": 25.17, "elapsed_time": "10:36:46", "remaining_time": "1 day, 7:32:38", "throughput": 334.01, "total_tokens": 12761536} {"current_steps": 10075, "total_steps": 40000, "loss": 0.0567, "lr": 0.2554477792586272, "epoch": 0.49226785234407444, "percentage": 25.19, "elapsed_time": "10:36:49", "remaining_time": "1 day, 7:31:32", "throughput": 334.15, "total_tokens": 12767968} {"current_steps": 10080, "total_steps": 40000, "loss": 0.0727, "lr": 0.25540587772695744, "epoch": 0.49251215400776877, "percentage": 25.2, "elapsed_time": "10:36:52", "remaining_time": "1 day, 7:30:25", "throughput": 334.28, "total_tokens": 12773824} {"current_steps": 10085, "total_steps": 40000, "loss": 0.0824, "lr": 0.2553639599403767, "epoch": 0.49275645567146314, "percentage": 25.21, "elapsed_time": "10:36:55", "remaining_time": "1 day, 7:29:19", "throughput": 334.41, "total_tokens": 12779904} {"current_steps": 10090, "total_steps": 40000, "loss": 0.0418, "lr": 0.2553220259053493, "epoch": 0.49300075733515747, "percentage": 25.22, "elapsed_time": "10:36:58", "remaining_time": "1 day, 7:28:13", "throughput": 334.55, "total_tokens": 12785984} {"current_steps": 10095, "total_steps": 40000, "loss": 0.0907, "lr": 0.2552800756283419, "epoch": 0.4932450589988518, "percentage": 25.24, "elapsed_time": "10:37:01", "remaining_time": "1 day, 7:27:07", "throughput": 334.68, "total_tokens": 12792224} {"current_steps": 10100, "total_steps": 40000, "loss": 0.086, "lr": 0.25523810911582373, "epoch": 0.4934893606625461, "percentage": 25.25, "elapsed_time": "10:37:05", "remaining_time": "1 day, 7:26:01", "throughput": 334.82, "total_tokens": 12798432} {"current_steps": 10105, "total_steps": 40000, "loss": 0.0604, "lr": 0.25519612637426675, "epoch": 0.49373366232624044, "percentage": 25.26, "elapsed_time": "10:37:08", "remaining_time": "1 day, 7:24:55", "throughput": 334.96, "total_tokens": 12804896} {"current_steps": 10110, "total_steps": 40000, "loss": 0.0818, "lr": 0.25515412741014504, "epoch": 0.49397796398993477, "percentage": 25.27, "elapsed_time": "10:37:11", "remaining_time": "1 day, 7:23:49", "throughput": 335.1, "total_tokens": 12811200} {"current_steps": 10115, "total_steps": 40000, "loss": 0.0613, "lr": 0.2551121122299355, "epoch": 0.4942222656536291, "percentage": 25.29, "elapsed_time": "10:37:14", "remaining_time": "1 day, 7:22:44", "throughput": 335.23, "total_tokens": 12817472} {"current_steps": 10120, "total_steps": 40000, "loss": 0.0446, "lr": 0.2550700808401173, "epoch": 0.4944665673173234, "percentage": 25.3, "elapsed_time": "10:37:17", "remaining_time": "1 day, 7:21:38", "throughput": 335.38, "total_tokens": 12823968} {"current_steps": 10125, "total_steps": 40000, "loss": 0.0836, "lr": 0.2550280332471722, "epoch": 0.49471086898101774, "percentage": 25.31, "elapsed_time": "10:37:20", "remaining_time": "1 day, 7:20:32", "throughput": 335.5, "total_tokens": 12829664} {"current_steps": 10130, "total_steps": 40000, "loss": 0.0736, "lr": 0.2549859694575845, "epoch": 0.4949551706447121, "percentage": 25.32, "elapsed_time": "10:37:23", "remaining_time": "1 day, 7:19:27", "throughput": 335.64, "total_tokens": 12835904} {"current_steps": 10135, "total_steps": 40000, "loss": 0.0465, "lr": 0.254943889477841, "epoch": 0.49519947230840644, "percentage": 25.34, "elapsed_time": "10:37:26", "remaining_time": "1 day, 7:18:21", "throughput": 335.78, "total_tokens": 12842272} {"current_steps": 10140, "total_steps": 40000, "loss": 0.0577, "lr": 0.25490179331443097, "epoch": 0.49544377397210076, "percentage": 25.35, "elapsed_time": "10:37:29", "remaining_time": "1 day, 7:17:17", "throughput": 335.92, "total_tokens": 12849056} {"current_steps": 10145, "total_steps": 40000, "loss": 0.0695, "lr": 0.25485968097384615, "epoch": 0.4956880756357951, "percentage": 25.36, "elapsed_time": "10:37:32", "remaining_time": "1 day, 7:16:11", "throughput": 336.06, "total_tokens": 12855200} {"current_steps": 10150, "total_steps": 40000, "loss": 0.0557, "lr": 0.25481755246258075, "epoch": 0.4959323772994894, "percentage": 25.37, "elapsed_time": "10:37:36", "remaining_time": "1 day, 7:15:06", "throughput": 336.2, "total_tokens": 12861632} {"current_steps": 10155, "total_steps": 40000, "loss": 0.055, "lr": 0.2547754077871315, "epoch": 0.49617667896318374, "percentage": 25.39, "elapsed_time": "10:37:39", "remaining_time": "1 day, 7:14:01", "throughput": 336.34, "total_tokens": 12868256} {"current_steps": 10160, "total_steps": 40000, "loss": 0.0738, "lr": 0.25473324695399774, "epoch": 0.49642098062687806, "percentage": 25.4, "elapsed_time": "10:37:42", "remaining_time": "1 day, 7:12:56", "throughput": 336.49, "total_tokens": 12875008} {"current_steps": 10165, "total_steps": 40000, "loss": 0.0411, "lr": 0.25469106996968105, "epoch": 0.4966652822905724, "percentage": 25.41, "elapsed_time": "10:37:45", "remaining_time": "1 day, 7:11:51", "throughput": 336.63, "total_tokens": 12881152} {"current_steps": 10170, "total_steps": 40000, "loss": 0.0693, "lr": 0.2546488768406858, "epoch": 0.4969095839542667, "percentage": 25.42, "elapsed_time": "10:37:48", "remaining_time": "1 day, 7:10:46", "throughput": 336.77, "total_tokens": 12887520} {"current_steps": 10175, "total_steps": 40000, "loss": 0.0745, "lr": 0.25460666757351863, "epoch": 0.49715388561796103, "percentage": 25.44, "elapsed_time": "10:37:51", "remaining_time": "1 day, 7:09:41", "throughput": 336.9, "total_tokens": 12893696} {"current_steps": 10180, "total_steps": 40000, "loss": 0.0868, "lr": 0.25456444217468877, "epoch": 0.4973981872816554, "percentage": 25.45, "elapsed_time": "10:37:54", "remaining_time": "1 day, 7:08:36", "throughput": 337.03, "total_tokens": 12899712} {"current_steps": 10185, "total_steps": 40000, "loss": 0.0481, "lr": 0.25452220065070785, "epoch": 0.49764248894534974, "percentage": 25.46, "elapsed_time": "10:37:57", "remaining_time": "1 day, 7:07:31", "throughput": 337.17, "total_tokens": 12905920} {"current_steps": 10190, "total_steps": 40000, "loss": 0.1088, "lr": 0.2544799430080901, "epoch": 0.49788679060904406, "percentage": 25.47, "elapsed_time": "10:38:00", "remaining_time": "1 day, 7:06:26", "throughput": 337.3, "total_tokens": 12911904} {"current_steps": 10195, "total_steps": 40000, "loss": 0.1, "lr": 0.2544376692533522, "epoch": 0.4981310922727384, "percentage": 25.49, "elapsed_time": "10:38:03", "remaining_time": "1 day, 7:05:21", "throughput": 337.44, "total_tokens": 12918368} {"current_steps": 10200, "total_steps": 40000, "loss": 0.0639, "lr": 0.2543953793930132, "epoch": 0.4983753939364327, "percentage": 25.5, "elapsed_time": "10:38:06", "remaining_time": "1 day, 7:04:17", "throughput": 337.58, "total_tokens": 12924960} {"current_steps": 10200, "total_steps": 40000, "eval_loss": 0.07258762419223785, "epoch": 0.4983753939364327, "percentage": 25.5, "elapsed_time": "10:48:46", "remaining_time": "1 day, 7:35:26", "throughput": 332.04, "total_tokens": 12924960} {"current_steps": 10205, "total_steps": 40000, "loss": 0.0962, "lr": 0.2543530734335948, "epoch": 0.49861969560012703, "percentage": 25.51, "elapsed_time": "10:48:50", "remaining_time": "1 day, 7:34:22", "throughput": 332.16, "total_tokens": 12930912} {"current_steps": 10210, "total_steps": 40000, "loss": 0.0642, "lr": 0.2543107513816211, "epoch": 0.49886399726382136, "percentage": 25.52, "elapsed_time": "10:48:53", "remaining_time": "1 day, 7:33:17", "throughput": 332.3, "total_tokens": 12937408} {"current_steps": 10215, "total_steps": 40000, "loss": 0.0501, "lr": 0.25426841324361865, "epoch": 0.4991082989275157, "percentage": 25.54, "elapsed_time": "10:48:56", "remaining_time": "1 day, 7:32:11", "throughput": 332.44, "total_tokens": 12944160} {"current_steps": 10220, "total_steps": 40000, "loss": 0.0624, "lr": 0.2542260590261166, "epoch": 0.49935260059121, "percentage": 25.55, "elapsed_time": "10:48:59", "remaining_time": "1 day, 7:31:06", "throughput": 332.58, "total_tokens": 12950528} {"current_steps": 10225, "total_steps": 40000, "loss": 0.0706, "lr": 0.2541836887356465, "epoch": 0.49959690225490433, "percentage": 25.56, "elapsed_time": "10:49:02", "remaining_time": "1 day, 7:30:00", "throughput": 332.71, "total_tokens": 12956736} {"current_steps": 10230, "total_steps": 40000, "loss": 0.0529, "lr": 0.2541413023787423, "epoch": 0.4998412039185987, "percentage": 25.57, "elapsed_time": "10:49:05", "remaining_time": "1 day, 7:28:55", "throughput": 332.85, "total_tokens": 12963232} {"current_steps": 10235, "total_steps": 40000, "loss": 0.0806, "lr": 0.2540988999619405, "epoch": 0.500085505582293, "percentage": 25.59, "elapsed_time": "10:49:09", "remaining_time": "1 day, 7:27:49", "throughput": 332.99, "total_tokens": 12969504} {"current_steps": 10240, "total_steps": 40000, "loss": 0.0843, "lr": 0.25405648149178023, "epoch": 0.5003298072459873, "percentage": 25.6, "elapsed_time": "10:49:12", "remaining_time": "1 day, 7:26:44", "throughput": 333.12, "total_tokens": 12975808} {"current_steps": 10245, "total_steps": 40000, "loss": 0.0595, "lr": 0.2540140469748028, "epoch": 0.5005741089096817, "percentage": 25.61, "elapsed_time": "10:49:15", "remaining_time": "1 day, 7:25:39", "throughput": 333.26, "total_tokens": 12982400} {"current_steps": 10250, "total_steps": 40000, "loss": 0.0839, "lr": 0.25397159641755224, "epoch": 0.500818410573376, "percentage": 25.62, "elapsed_time": "10:49:18", "remaining_time": "1 day, 7:24:33", "throughput": 333.39, "total_tokens": 12988192} {"current_steps": 10255, "total_steps": 40000, "loss": 0.0919, "lr": 0.2539291298265749, "epoch": 0.5010627122370703, "percentage": 25.64, "elapsed_time": "10:49:21", "remaining_time": "1 day, 7:23:29", "throughput": 333.54, "total_tokens": 12995264} {"current_steps": 10260, "total_steps": 40000, "loss": 0.1052, "lr": 0.2538866472084197, "epoch": 0.5013070139007647, "percentage": 25.65, "elapsed_time": "10:49:24", "remaining_time": "1 day, 7:22:23", "throughput": 333.67, "total_tokens": 13001440} {"current_steps": 10265, "total_steps": 40000, "loss": 0.0972, "lr": 0.25384414856963794, "epoch": 0.501551315564459, "percentage": 25.66, "elapsed_time": "10:49:27", "remaining_time": "1 day, 7:21:18", "throughput": 333.8, "total_tokens": 13007392} {"current_steps": 10270, "total_steps": 40000, "loss": 0.059, "lr": 0.25380163391678356, "epoch": 0.5017956172281534, "percentage": 25.67, "elapsed_time": "10:49:30", "remaining_time": "1 day, 7:20:13", "throughput": 333.94, "total_tokens": 13013728} {"current_steps": 10275, "total_steps": 40000, "loss": 0.0556, "lr": 0.2537591032564127, "epoch": 0.5020399188918476, "percentage": 25.69, "elapsed_time": "10:49:33", "remaining_time": "1 day, 7:19:08", "throughput": 334.06, "total_tokens": 13019712} {"current_steps": 10280, "total_steps": 40000, "loss": 0.0809, "lr": 0.25371655659508424, "epoch": 0.502284220555542, "percentage": 25.7, "elapsed_time": "10:49:36", "remaining_time": "1 day, 7:18:03", "throughput": 334.21, "total_tokens": 13026400} {"current_steps": 10285, "total_steps": 40000, "loss": 0.0422, "lr": 0.25367399393935935, "epoch": 0.5025285222192363, "percentage": 25.71, "elapsed_time": "10:49:40", "remaining_time": "1 day, 7:16:59", "throughput": 334.36, "total_tokens": 13033408} {"current_steps": 10290, "total_steps": 40000, "loss": 0.0484, "lr": 0.25363141529580174, "epoch": 0.5027728238829307, "percentage": 25.72, "elapsed_time": "10:49:43", "remaining_time": "1 day, 7:15:54", "throughput": 334.48, "total_tokens": 13039200} {"current_steps": 10295, "total_steps": 40000, "loss": 0.0604, "lr": 0.2535888206709776, "epoch": 0.5030171255466249, "percentage": 25.74, "elapsed_time": "10:49:46", "remaining_time": "1 day, 7:14:49", "throughput": 334.62, "total_tokens": 13045504} {"current_steps": 10300, "total_steps": 40000, "loss": 0.0597, "lr": 0.2535462100714555, "epoch": 0.5032614272103193, "percentage": 25.75, "elapsed_time": "10:49:49", "remaining_time": "1 day, 7:13:45", "throughput": 334.76, "total_tokens": 13052064} {"current_steps": 10305, "total_steps": 40000, "loss": 0.0559, "lr": 0.2535035835038066, "epoch": 0.5035057288740137, "percentage": 25.76, "elapsed_time": "10:49:52", "remaining_time": "1 day, 7:12:40", "throughput": 334.89, "total_tokens": 13058080} {"current_steps": 10310, "total_steps": 40000, "loss": 0.0881, "lr": 0.2534609409746044, "epoch": 0.503750030537708, "percentage": 25.77, "elapsed_time": "10:49:55", "remaining_time": "1 day, 7:11:36", "throughput": 335.03, "total_tokens": 13064512} {"current_steps": 10315, "total_steps": 40000, "loss": 0.056, "lr": 0.253418282490425, "epoch": 0.5039943322014023, "percentage": 25.79, "elapsed_time": "10:49:58", "remaining_time": "1 day, 7:10:31", "throughput": 335.15, "total_tokens": 13070368} {"current_steps": 10320, "total_steps": 40000, "loss": 0.0646, "lr": 0.2533756080578467, "epoch": 0.5042386338650966, "percentage": 25.8, "elapsed_time": "10:50:01", "remaining_time": "1 day, 7:09:27", "throughput": 335.28, "total_tokens": 13076576} {"current_steps": 10325, "total_steps": 40000, "loss": 0.0686, "lr": 0.25333291768345056, "epoch": 0.504482935528791, "percentage": 25.81, "elapsed_time": "10:50:04", "remaining_time": "1 day, 7:08:22", "throughput": 335.43, "total_tokens": 13083168} {"current_steps": 10330, "total_steps": 40000, "loss": 0.086, "lr": 0.25329021137381996, "epoch": 0.5047272371924852, "percentage": 25.82, "elapsed_time": "10:50:07", "remaining_time": "1 day, 7:07:18", "throughput": 335.57, "total_tokens": 13089856} {"current_steps": 10335, "total_steps": 40000, "loss": 0.1024, "lr": 0.25324748913554074, "epoch": 0.5049715388561796, "percentage": 25.84, "elapsed_time": "10:50:10", "remaining_time": "1 day, 7:06:14", "throughput": 335.71, "total_tokens": 13096384} {"current_steps": 10340, "total_steps": 40000, "loss": 0.0948, "lr": 0.2532047509752013, "epoch": 0.5052158405198739, "percentage": 25.85, "elapsed_time": "10:50:14", "remaining_time": "1 day, 7:05:10", "throughput": 335.86, "total_tokens": 13103200} {"current_steps": 10345, "total_steps": 40000, "loss": 0.0659, "lr": 0.25316199689939217, "epoch": 0.5054601421835683, "percentage": 25.86, "elapsed_time": "10:50:17", "remaining_time": "1 day, 7:04:06", "throughput": 336.0, "total_tokens": 13109600} {"current_steps": 10350, "total_steps": 40000, "loss": 0.1306, "lr": 0.2531192269147068, "epoch": 0.5057044438472627, "percentage": 25.87, "elapsed_time": "10:50:20", "remaining_time": "1 day, 7:03:02", "throughput": 336.12, "total_tokens": 13115616} {"current_steps": 10355, "total_steps": 40000, "loss": 0.0616, "lr": 0.2530764410277407, "epoch": 0.5059487455109569, "percentage": 25.89, "elapsed_time": "10:50:23", "remaining_time": "1 day, 7:01:58", "throughput": 336.26, "total_tokens": 13121920} {"current_steps": 10360, "total_steps": 40000, "loss": 0.0538, "lr": 0.25303363924509203, "epoch": 0.5061930471746513, "percentage": 25.9, "elapsed_time": "10:50:26", "remaining_time": "1 day, 7:00:54", "throughput": 336.38, "total_tokens": 13127776} {"current_steps": 10365, "total_steps": 40000, "loss": 0.0795, "lr": 0.25299082157336145, "epoch": 0.5064373488383456, "percentage": 25.91, "elapsed_time": "10:50:29", "remaining_time": "1 day, 6:59:50", "throughput": 336.52, "total_tokens": 13134272} {"current_steps": 10370, "total_steps": 40000, "loss": 0.0569, "lr": 0.2529479880191519, "epoch": 0.50668165050204, "percentage": 25.92, "elapsed_time": "10:50:32", "remaining_time": "1 day, 6:58:47", "throughput": 336.65, "total_tokens": 13140512} {"current_steps": 10375, "total_steps": 40000, "loss": 0.0648, "lr": 0.2529051385890689, "epoch": 0.5069259521657342, "percentage": 25.94, "elapsed_time": "10:50:35", "remaining_time": "1 day, 6:57:43", "throughput": 336.79, "total_tokens": 13146784} {"current_steps": 10380, "total_steps": 40000, "loss": 0.0538, "lr": 0.2528622732897203, "epoch": 0.5071702538294286, "percentage": 25.95, "elapsed_time": "10:50:38", "remaining_time": "1 day, 6:56:39", "throughput": 336.93, "total_tokens": 13153376} {"current_steps": 10385, "total_steps": 40000, "loss": 0.0515, "lr": 0.25281939212771654, "epoch": 0.5074145554931229, "percentage": 25.96, "elapsed_time": "10:50:41", "remaining_time": "1 day, 6:55:35", "throughput": 337.05, "total_tokens": 13159168} {"current_steps": 10390, "total_steps": 40000, "loss": 0.0734, "lr": 0.2527764951096704, "epoch": 0.5076588571568172, "percentage": 25.97, "elapsed_time": "10:50:44", "remaining_time": "1 day, 6:54:31", "throughput": 337.18, "total_tokens": 13164928} {"current_steps": 10395, "total_steps": 40000, "loss": 0.0957, "lr": 0.2527335822421971, "epoch": 0.5079031588205115, "percentage": 25.99, "elapsed_time": "10:50:47", "remaining_time": "1 day, 6:53:27", "throughput": 337.29, "total_tokens": 13170560} {"current_steps": 10400, "total_steps": 40000, "loss": 0.0512, "lr": 0.25269065353191444, "epoch": 0.5081474604842059, "percentage": 26.0, "elapsed_time": "10:50:50", "remaining_time": "1 day, 6:52:24", "throughput": 337.42, "total_tokens": 13176640} {"current_steps": 10400, "total_steps": 40000, "eval_loss": 0.0713978111743927, "epoch": 0.5081474604842059, "percentage": 26.0, "elapsed_time": "11:01:29", "remaining_time": "1 day, 7:22:42", "throughput": 331.99, "total_tokens": 13176640} {"current_steps": 10405, "total_steps": 40000, "loss": 0.0572, "lr": 0.2526477089854425, "epoch": 0.5083917621479003, "percentage": 26.01, "elapsed_time": "11:01:33", "remaining_time": "1 day, 7:21:39", "throughput": 332.12, "total_tokens": 13182720} {"current_steps": 10410, "total_steps": 40000, "loss": 0.0386, "lr": 0.25260474860940385, "epoch": 0.5086360638115945, "percentage": 26.02, "elapsed_time": "11:01:36", "remaining_time": "1 day, 7:20:35", "throughput": 332.26, "total_tokens": 13189440} {"current_steps": 10415, "total_steps": 40000, "loss": 0.0818, "lr": 0.2525617724104236, "epoch": 0.5088803654752889, "percentage": 26.04, "elapsed_time": "11:01:39", "remaining_time": "1 day, 7:19:30", "throughput": 332.38, "total_tokens": 13195360} {"current_steps": 10420, "total_steps": 40000, "loss": 0.0719, "lr": 0.25251878039512915, "epoch": 0.5091246671389832, "percentage": 26.05, "elapsed_time": "11:01:42", "remaining_time": "1 day, 7:18:26", "throughput": 332.52, "total_tokens": 13201856} {"current_steps": 10425, "total_steps": 40000, "loss": 0.0935, "lr": 0.25247577257015047, "epoch": 0.5093689688026776, "percentage": 26.06, "elapsed_time": "11:01:45", "remaining_time": "1 day, 7:17:22", "throughput": 332.65, "total_tokens": 13208224} {"current_steps": 10430, "total_steps": 40000, "loss": 0.0543, "lr": 0.2524327489421198, "epoch": 0.5096132704663718, "percentage": 26.07, "elapsed_time": "11:01:48", "remaining_time": "1 day, 7:16:17", "throughput": 332.78, "total_tokens": 13214432} {"current_steps": 10435, "total_steps": 40000, "loss": 0.0922, "lr": 0.25238970951767203, "epoch": 0.5098575721300662, "percentage": 26.09, "elapsed_time": "11:01:51", "remaining_time": "1 day, 7:15:13", "throughput": 332.91, "total_tokens": 13220384} {"current_steps": 10440, "total_steps": 40000, "loss": 0.0551, "lr": 0.25234665430344433, "epoch": 0.5101018737937605, "percentage": 26.1, "elapsed_time": "11:01:54", "remaining_time": "1 day, 7:14:09", "throughput": 333.05, "total_tokens": 13227040} {"current_steps": 10445, "total_steps": 40000, "loss": 0.0686, "lr": 0.2523035833060764, "epoch": 0.5103461754574549, "percentage": 26.11, "elapsed_time": "11:01:58", "remaining_time": "1 day, 7:13:05", "throughput": 333.19, "total_tokens": 13233728} {"current_steps": 10450, "total_steps": 40000, "loss": 0.0806, "lr": 0.2522604965322103, "epoch": 0.5105904771211492, "percentage": 26.12, "elapsed_time": "11:02:01", "remaining_time": "1 day, 7:12:01", "throughput": 333.32, "total_tokens": 13239936} {"current_steps": 10455, "total_steps": 40000, "loss": 0.0517, "lr": 0.25221739398849047, "epoch": 0.5108347787848435, "percentage": 26.14, "elapsed_time": "11:02:04", "remaining_time": "1 day, 7:10:57", "throughput": 333.45, "total_tokens": 13246112} {"current_steps": 10460, "total_steps": 40000, "loss": 0.0456, "lr": 0.252174275681564, "epoch": 0.5110790804485379, "percentage": 26.15, "elapsed_time": "11:02:07", "remaining_time": "1 day, 7:09:53", "throughput": 333.58, "total_tokens": 13252352} {"current_steps": 10465, "total_steps": 40000, "loss": 0.0744, "lr": 0.2521311416180802, "epoch": 0.5113233821122322, "percentage": 26.16, "elapsed_time": "11:02:10", "remaining_time": "1 day, 7:08:49", "throughput": 333.71, "total_tokens": 13258496} {"current_steps": 10470, "total_steps": 40000, "loss": 0.0255, "lr": 0.25208799180469094, "epoch": 0.5115676837759265, "percentage": 26.17, "elapsed_time": "11:02:13", "remaining_time": "1 day, 7:07:45", "throughput": 333.84, "total_tokens": 13264544} {"current_steps": 10475, "total_steps": 40000, "loss": 0.0864, "lr": 0.2520448262480504, "epoch": 0.5118119854396208, "percentage": 26.19, "elapsed_time": "11:02:16", "remaining_time": "1 day, 7:06:41", "throughput": 333.97, "total_tokens": 13270816} {"current_steps": 10480, "total_steps": 40000, "loss": 0.0786, "lr": 0.25200164495481525, "epoch": 0.5120562871033152, "percentage": 26.2, "elapsed_time": "11:02:19", "remaining_time": "1 day, 7:05:37", "throughput": 334.11, "total_tokens": 13277376} {"current_steps": 10485, "total_steps": 40000, "loss": 0.0804, "lr": 0.25195844793164474, "epoch": 0.5123005887670095, "percentage": 26.21, "elapsed_time": "11:02:22", "remaining_time": "1 day, 7:04:34", "throughput": 334.26, "total_tokens": 13284384} {"current_steps": 10490, "total_steps": 40000, "loss": 0.0761, "lr": 0.2519152351852001, "epoch": 0.5125448904307038, "percentage": 26.22, "elapsed_time": "11:02:25", "remaining_time": "1 day, 7:03:31", "throughput": 334.4, "total_tokens": 13290944} {"current_steps": 10495, "total_steps": 40000, "loss": 0.0557, "lr": 0.25187200672214555, "epoch": 0.5127891920943982, "percentage": 26.24, "elapsed_time": "11:02:28", "remaining_time": "1 day, 7:02:27", "throughput": 334.53, "total_tokens": 13297024} {"current_steps": 10500, "total_steps": 40000, "loss": 0.0489, "lr": 0.2518287625491473, "epoch": 0.5130334937580925, "percentage": 26.25, "elapsed_time": "11:02:31", "remaining_time": "1 day, 7:01:24", "throughput": 334.66, "total_tokens": 13303552} {"current_steps": 10505, "total_steps": 40000, "loss": 0.0465, "lr": 0.25178550267287425, "epoch": 0.5132777954217869, "percentage": 26.26, "elapsed_time": "11:02:35", "remaining_time": "1 day, 7:00:20", "throughput": 334.8, "total_tokens": 13310016} {"current_steps": 10510, "total_steps": 40000, "loss": 0.0459, "lr": 0.2517422270999976, "epoch": 0.5135220970854811, "percentage": 26.27, "elapsed_time": "11:02:38", "remaining_time": "1 day, 6:59:17", "throughput": 334.93, "total_tokens": 13315968} {"current_steps": 10515, "total_steps": 40000, "loss": 0.0754, "lr": 0.2516989358371909, "epoch": 0.5137663987491755, "percentage": 26.29, "elapsed_time": "11:02:41", "remaining_time": "1 day, 6:58:13", "throughput": 335.07, "total_tokens": 13322656} {"current_steps": 10520, "total_steps": 40000, "loss": 0.0871, "lr": 0.25165562889113025, "epoch": 0.5140107004128698, "percentage": 26.3, "elapsed_time": "11:02:44", "remaining_time": "1 day, 6:57:10", "throughput": 335.19, "total_tokens": 13328672} {"current_steps": 10525, "total_steps": 40000, "loss": 0.0526, "lr": 0.2516123062684942, "epoch": 0.5142550020765642, "percentage": 26.31, "elapsed_time": "11:02:47", "remaining_time": "1 day, 6:56:07", "throughput": 335.32, "total_tokens": 13334912} {"current_steps": 10530, "total_steps": 40000, "loss": 0.0815, "lr": 0.25156896797596356, "epoch": 0.5144993037402584, "percentage": 26.32, "elapsed_time": "11:02:50", "remaining_time": "1 day, 6:55:04", "throughput": 335.46, "total_tokens": 13341184} {"current_steps": 10535, "total_steps": 40000, "loss": 0.0709, "lr": 0.2515256140202216, "epoch": 0.5147436054039528, "percentage": 26.34, "elapsed_time": "11:02:53", "remaining_time": "1 day, 6:54:00", "throughput": 335.58, "total_tokens": 13347008} {"current_steps": 10540, "total_steps": 40000, "loss": 0.0792, "lr": 0.25148224440795425, "epoch": 0.5149879070676471, "percentage": 26.35, "elapsed_time": "11:02:56", "remaining_time": "1 day, 6:52:57", "throughput": 335.71, "total_tokens": 13353152} {"current_steps": 10545, "total_steps": 40000, "loss": 0.0769, "lr": 0.2514388591458494, "epoch": 0.5152322087313415, "percentage": 26.36, "elapsed_time": "11:02:59", "remaining_time": "1 day, 6:51:54", "throughput": 335.84, "total_tokens": 13359424} {"current_steps": 10550, "total_steps": 40000, "loss": 0.0818, "lr": 0.2513954582405977, "epoch": 0.5154765103950358, "percentage": 26.38, "elapsed_time": "11:03:02", "remaining_time": "1 day, 6:50:51", "throughput": 335.97, "total_tokens": 13365824} {"current_steps": 10555, "total_steps": 40000, "loss": 0.0755, "lr": 0.2513520416988922, "epoch": 0.5157208120587301, "percentage": 26.39, "elapsed_time": "11:03:05", "remaining_time": "1 day, 6:49:48", "throughput": 336.1, "total_tokens": 13371808} {"current_steps": 10560, "total_steps": 40000, "loss": 0.0913, "lr": 0.2513086095274281, "epoch": 0.5159651137224245, "percentage": 26.4, "elapsed_time": "11:03:08", "remaining_time": "1 day, 6:48:46", "throughput": 336.23, "total_tokens": 13378240} {"current_steps": 10565, "total_steps": 40000, "loss": 0.0817, "lr": 0.25126516173290336, "epoch": 0.5162094153861188, "percentage": 26.41, "elapsed_time": "11:03:11", "remaining_time": "1 day, 6:47:43", "throughput": 336.37, "total_tokens": 13384736} {"current_steps": 10570, "total_steps": 40000, "loss": 0.057, "lr": 0.2512216983220181, "epoch": 0.5164537170498131, "percentage": 26.42, "elapsed_time": "11:03:14", "remaining_time": "1 day, 6:46:41", "throughput": 336.49, "total_tokens": 13390656} {"current_steps": 10575, "total_steps": 40000, "loss": 0.068, "lr": 0.25117821930147494, "epoch": 0.5166980187135074, "percentage": 26.44, "elapsed_time": "11:03:18", "remaining_time": "1 day, 6:45:38", "throughput": 336.64, "total_tokens": 13397664} {"current_steps": 10580, "total_steps": 40000, "loss": 0.0715, "lr": 0.2511347246779788, "epoch": 0.5169423203772018, "percentage": 26.45, "elapsed_time": "11:03:21", "remaining_time": "1 day, 6:44:36", "throughput": 336.79, "total_tokens": 13404864} {"current_steps": 10585, "total_steps": 40000, "loss": 0.0789, "lr": 0.25109121445823723, "epoch": 0.517186622040896, "percentage": 26.46, "elapsed_time": "11:03:24", "remaining_time": "1 day, 6:43:34", "throughput": 336.93, "total_tokens": 13411424} {"current_steps": 10590, "total_steps": 40000, "loss": 0.0708, "lr": 0.25104768864896004, "epoch": 0.5174309237045904, "percentage": 26.47, "elapsed_time": "11:03:27", "remaining_time": "1 day, 6:42:31", "throughput": 337.07, "total_tokens": 13417792} {"current_steps": 10595, "total_steps": 40000, "loss": 0.0655, "lr": 0.2510041472568594, "epoch": 0.5176752253682848, "percentage": 26.49, "elapsed_time": "11:03:30", "remaining_time": "1 day, 6:41:29", "throughput": 337.2, "total_tokens": 13424320} {"current_steps": 10600, "total_steps": 40000, "loss": 0.0672, "lr": 0.25096059028864987, "epoch": 0.5179195270319791, "percentage": 26.5, "elapsed_time": "11:03:33", "remaining_time": "1 day, 6:40:27", "throughput": 337.34, "total_tokens": 13430912} {"current_steps": 10600, "total_steps": 40000, "eval_loss": 0.07073386013507843, "epoch": 0.5179195270319791, "percentage": 26.5, "elapsed_time": "11:14:14", "remaining_time": "1 day, 7:10:02", "throughput": 332.0, "total_tokens": 13430912} {"current_steps": 10605, "total_steps": 40000, "loss": 0.0409, "lr": 0.25091701775104863, "epoch": 0.5181638286956735, "percentage": 26.51, "elapsed_time": "11:14:17", "remaining_time": "1 day, 7:09:01", "throughput": 332.12, "total_tokens": 13437024} {"current_steps": 10610, "total_steps": 40000, "loss": 0.0965, "lr": 0.250873429650775, "epoch": 0.5184081303593677, "percentage": 26.52, "elapsed_time": "11:14:20", "remaining_time": "1 day, 7:07:57", "throughput": 332.25, "total_tokens": 13443232} {"current_steps": 10615, "total_steps": 40000, "loss": 0.0677, "lr": 0.25082982599455095, "epoch": 0.5186524320230621, "percentage": 26.54, "elapsed_time": "11:14:23", "remaining_time": "1 day, 7:06:54", "throughput": 332.38, "total_tokens": 13449472} {"current_steps": 10620, "total_steps": 40000, "loss": 0.0619, "lr": 0.2507862067891006, "epoch": 0.5188967336867564, "percentage": 26.55, "elapsed_time": "11:14:26", "remaining_time": "1 day, 7:05:51", "throughput": 332.51, "total_tokens": 13455552} {"current_steps": 10625, "total_steps": 40000, "loss": 0.0817, "lr": 0.25074257204115064, "epoch": 0.5191410353504508, "percentage": 26.56, "elapsed_time": "11:14:29", "remaining_time": "1 day, 7:04:47", "throughput": 332.63, "total_tokens": 13461600} {"current_steps": 10630, "total_steps": 40000, "loss": 0.057, "lr": 0.25069892175742997, "epoch": 0.519385337014145, "percentage": 26.57, "elapsed_time": "11:14:32", "remaining_time": "1 day, 7:03:44", "throughput": 332.76, "total_tokens": 13467840} {"current_steps": 10635, "total_steps": 40000, "loss": 0.0856, "lr": 0.25065525594467014, "epoch": 0.5196296386778394, "percentage": 26.59, "elapsed_time": "11:14:35", "remaining_time": "1 day, 7:02:40", "throughput": 332.88, "total_tokens": 13473792} {"current_steps": 10640, "total_steps": 40000, "loss": 0.0763, "lr": 0.2506115746096049, "epoch": 0.5198739403415338, "percentage": 26.6, "elapsed_time": "11:14:39", "remaining_time": "1 day, 7:01:37", "throughput": 333.02, "total_tokens": 13480288} {"current_steps": 10645, "total_steps": 40000, "loss": 0.0548, "lr": 0.25056787775897055, "epoch": 0.520118242005228, "percentage": 26.61, "elapsed_time": "11:14:42", "remaining_time": "1 day, 7:00:34", "throughput": 333.14, "total_tokens": 13486368} {"current_steps": 10650, "total_steps": 40000, "loss": 0.055, "lr": 0.2505241653995056, "epoch": 0.5203625436689224, "percentage": 26.62, "elapsed_time": "11:14:45", "remaining_time": "1 day, 6:59:32", "throughput": 333.28, "total_tokens": 13492992} {"current_steps": 10655, "total_steps": 40000, "loss": 0.0425, "lr": 0.25048043753795113, "epoch": 0.5206068453326167, "percentage": 26.64, "elapsed_time": "11:14:48", "remaining_time": "1 day, 6:58:29", "throughput": 333.42, "total_tokens": 13499456} {"current_steps": 10660, "total_steps": 40000, "loss": 0.057, "lr": 0.2504366941810504, "epoch": 0.5208511469963111, "percentage": 26.65, "elapsed_time": "11:14:51", "remaining_time": "1 day, 6:57:26", "throughput": 333.55, "total_tokens": 13506048} {"current_steps": 10665, "total_steps": 40000, "loss": 0.1038, "lr": 0.2503929353355493, "epoch": 0.5210954486600053, "percentage": 26.66, "elapsed_time": "11:14:54", "remaining_time": "1 day, 6:56:23", "throughput": 333.68, "total_tokens": 13512032} {"current_steps": 10670, "total_steps": 40000, "loss": 0.0719, "lr": 0.250349161008196, "epoch": 0.5213397503236997, "percentage": 26.67, "elapsed_time": "11:14:57", "remaining_time": "1 day, 6:55:21", "throughput": 333.81, "total_tokens": 13518688} {"current_steps": 10675, "total_steps": 40000, "loss": 0.0774, "lr": 0.2503053712057409, "epoch": 0.521584051987394, "percentage": 26.69, "elapsed_time": "11:15:00", "remaining_time": "1 day, 6:54:18", "throughput": 333.93, "total_tokens": 13524608} {"current_steps": 10680, "total_steps": 40000, "loss": 0.0705, "lr": 0.25026156593493715, "epoch": 0.5218283536510884, "percentage": 26.7, "elapsed_time": "11:15:03", "remaining_time": "1 day, 6:53:16", "throughput": 334.07, "total_tokens": 13531072} {"current_steps": 10685, "total_steps": 40000, "loss": 0.0495, "lr": 0.2502177452025399, "epoch": 0.5220726553147826, "percentage": 26.71, "elapsed_time": "11:15:07", "remaining_time": "1 day, 6:52:13", "throughput": 334.21, "total_tokens": 13537792} {"current_steps": 10690, "total_steps": 40000, "loss": 0.0721, "lr": 0.25017390901530695, "epoch": 0.522316956978477, "percentage": 26.72, "elapsed_time": "11:15:10", "remaining_time": "1 day, 6:51:11", "throughput": 334.34, "total_tokens": 13544160} {"current_steps": 10695, "total_steps": 40000, "loss": 0.0528, "lr": 0.2501300573799984, "epoch": 0.5225612586421714, "percentage": 26.74, "elapsed_time": "11:15:13", "remaining_time": "1 day, 6:50:08", "throughput": 334.46, "total_tokens": 13550176} {"current_steps": 10700, "total_steps": 40000, "loss": 0.0849, "lr": 0.2500861903033766, "epoch": 0.5228055603058657, "percentage": 26.75, "elapsed_time": "11:15:16", "remaining_time": "1 day, 6:49:06", "throughput": 334.59, "total_tokens": 13556288} {"current_steps": 10705, "total_steps": 40000, "loss": 0.0814, "lr": 0.25004230779220654, "epoch": 0.52304986196956, "percentage": 26.76, "elapsed_time": "11:15:19", "remaining_time": "1 day, 6:48:03", "throughput": 334.72, "total_tokens": 13562592} {"current_steps": 10710, "total_steps": 40000, "loss": 0.0782, "lr": 0.24999840985325542, "epoch": 0.5232941636332543, "percentage": 26.77, "elapsed_time": "11:15:22", "remaining_time": "1 day, 6:47:01", "throughput": 334.85, "total_tokens": 13568960} {"current_steps": 10715, "total_steps": 40000, "loss": 0.0897, "lr": 0.24995449649329285, "epoch": 0.5235384652969487, "percentage": 26.79, "elapsed_time": "11:15:25", "remaining_time": "1 day, 6:45:59", "throughput": 334.99, "total_tokens": 13575744} {"current_steps": 10720, "total_steps": 40000, "loss": 0.0631, "lr": 0.2499105677190908, "epoch": 0.523782766960643, "percentage": 26.8, "elapsed_time": "11:15:28", "remaining_time": "1 day, 6:44:57", "throughput": 335.13, "total_tokens": 13582368} {"current_steps": 10725, "total_steps": 40000, "loss": 0.0662, "lr": 0.24986662353742364, "epoch": 0.5240270686243373, "percentage": 26.81, "elapsed_time": "11:15:31", "remaining_time": "1 day, 6:43:55", "throughput": 335.27, "total_tokens": 13588960} {"current_steps": 10730, "total_steps": 40000, "loss": 0.0555, "lr": 0.24982266395506814, "epoch": 0.5242713702880316, "percentage": 26.82, "elapsed_time": "11:15:34", "remaining_time": "1 day, 6:42:53", "throughput": 335.4, "total_tokens": 13595232} {"current_steps": 10735, "total_steps": 40000, "loss": 0.0905, "lr": 0.2497786889788034, "epoch": 0.524515671951726, "percentage": 26.84, "elapsed_time": "11:15:37", "remaining_time": "1 day, 6:41:51", "throughput": 335.52, "total_tokens": 13601248} {"current_steps": 10740, "total_steps": 40000, "loss": 0.0669, "lr": 0.24973469861541095, "epoch": 0.5247599736154204, "percentage": 26.85, "elapsed_time": "11:15:41", "remaining_time": "1 day, 6:40:49", "throughput": 335.64, "total_tokens": 13607360} {"current_steps": 10745, "total_steps": 40000, "loss": 0.055, "lr": 0.24969069287167456, "epoch": 0.5250042752791146, "percentage": 26.86, "elapsed_time": "11:15:44", "remaining_time": "1 day, 6:39:47", "throughput": 335.77, "total_tokens": 13613504} {"current_steps": 10750, "total_steps": 40000, "loss": 0.1219, "lr": 0.2496466717543806, "epoch": 0.525248576942809, "percentage": 26.88, "elapsed_time": "11:15:47", "remaining_time": "1 day, 6:38:46", "throughput": 335.9, "total_tokens": 13619744} {"current_steps": 10755, "total_steps": 40000, "loss": 0.0896, "lr": 0.24960263527031762, "epoch": 0.5254928786065033, "percentage": 26.89, "elapsed_time": "11:15:50", "remaining_time": "1 day, 6:37:44", "throughput": 336.03, "total_tokens": 13626176} {"current_steps": 10760, "total_steps": 40000, "loss": 0.0738, "lr": 0.24955858342627657, "epoch": 0.5257371802701977, "percentage": 26.9, "elapsed_time": "11:15:53", "remaining_time": "1 day, 6:36:42", "throughput": 336.17, "total_tokens": 13632704} {"current_steps": 10765, "total_steps": 40000, "loss": 0.0539, "lr": 0.24951451622905083, "epoch": 0.5259814819338919, "percentage": 26.91, "elapsed_time": "11:15:56", "remaining_time": "1 day, 6:35:41", "throughput": 336.29, "total_tokens": 13638816} {"current_steps": 10770, "total_steps": 40000, "loss": 0.069, "lr": 0.24947043368543612, "epoch": 0.5262257835975863, "percentage": 26.92, "elapsed_time": "11:15:59", "remaining_time": "1 day, 6:34:40", "throughput": 336.44, "total_tokens": 13645920} {"current_steps": 10775, "total_steps": 40000, "loss": 0.0511, "lr": 0.2494263358022305, "epoch": 0.5264700852612806, "percentage": 26.94, "elapsed_time": "11:16:02", "remaining_time": "1 day, 6:33:38", "throughput": 336.58, "total_tokens": 13652480} {"current_steps": 10780, "total_steps": 40000, "loss": 0.0771, "lr": 0.24938222258623444, "epoch": 0.526714386924975, "percentage": 26.95, "elapsed_time": "11:16:06", "remaining_time": "1 day, 6:32:37", "throughput": 336.71, "total_tokens": 13659072} {"current_steps": 10785, "total_steps": 40000, "loss": 0.0918, "lr": 0.24933809404425075, "epoch": 0.5269586885886693, "percentage": 26.96, "elapsed_time": "11:16:09", "remaining_time": "1 day, 6:31:35", "throughput": 336.84, "total_tokens": 13665088} {"current_steps": 10790, "total_steps": 40000, "loss": 0.0516, "lr": 0.24929395018308453, "epoch": 0.5272029902523636, "percentage": 26.97, "elapsed_time": "11:16:12", "remaining_time": "1 day, 6:30:34", "throughput": 336.97, "total_tokens": 13671808} {"current_steps": 10795, "total_steps": 40000, "loss": 0.0583, "lr": 0.24924979100954348, "epoch": 0.527447291916058, "percentage": 26.99, "elapsed_time": "11:16:15", "remaining_time": "1 day, 6:29:33", "throughput": 337.11, "total_tokens": 13678432} {"current_steps": 10800, "total_steps": 40000, "loss": 0.0674, "lr": 0.24920561653043735, "epoch": 0.5276915935797523, "percentage": 27.0, "elapsed_time": "11:16:18", "remaining_time": "1 day, 6:28:31", "throughput": 337.23, "total_tokens": 13684288} {"current_steps": 10800, "total_steps": 40000, "eval_loss": 0.07288419455289841, "epoch": 0.5276915935797523, "percentage": 27.0, "elapsed_time": "11:26:58", "remaining_time": "1 day, 6:57:22", "throughput": 331.99, "total_tokens": 13684288} {"current_steps": 10805, "total_steps": 40000, "loss": 0.0716, "lr": 0.24916142675257846, "epoch": 0.5279358952434466, "percentage": 27.01, "elapsed_time": "11:27:02", "remaining_time": "1 day, 6:56:23", "throughput": 332.12, "total_tokens": 13690976} {"current_steps": 10810, "total_steps": 40000, "loss": 0.052, "lr": 0.24911722168278144, "epoch": 0.5281801969071409, "percentage": 27.02, "elapsed_time": "11:27:05", "remaining_time": "1 day, 6:55:20", "throughput": 332.25, "total_tokens": 13697184} {"current_steps": 10815, "total_steps": 40000, "loss": 0.0515, "lr": 0.24907300132786328, "epoch": 0.5284244985708353, "percentage": 27.04, "elapsed_time": "11:27:08", "remaining_time": "1 day, 6:54:18", "throughput": 332.38, "total_tokens": 13703840} {"current_steps": 10820, "total_steps": 40000, "loss": 0.0845, "lr": 0.24902876569464322, "epoch": 0.5286688002345296, "percentage": 27.05, "elapsed_time": "11:27:11", "remaining_time": "1 day, 6:53:16", "throughput": 332.51, "total_tokens": 13710080} {"current_steps": 10825, "total_steps": 40000, "loss": 0.0696, "lr": 0.24898451478994305, "epoch": 0.5289131018982239, "percentage": 27.06, "elapsed_time": "11:27:14", "remaining_time": "1 day, 6:52:14", "throughput": 332.64, "total_tokens": 13716352} {"current_steps": 10830, "total_steps": 40000, "loss": 0.089, "lr": 0.2489402486205868, "epoch": 0.5291574035619182, "percentage": 27.07, "elapsed_time": "11:27:18", "remaining_time": "1 day, 6:51:12", "throughput": 332.78, "total_tokens": 13723200} {"current_steps": 10835, "total_steps": 40000, "loss": 0.08, "lr": 0.24889596719340085, "epoch": 0.5294017052256126, "percentage": 27.09, "elapsed_time": "11:27:21", "remaining_time": "1 day, 6:50:10", "throughput": 332.9, "total_tokens": 13729216} {"current_steps": 10840, "total_steps": 40000, "loss": 0.0959, "lr": 0.24885167051521392, "epoch": 0.529646006889307, "percentage": 27.1, "elapsed_time": "11:27:24", "remaining_time": "1 day, 6:49:08", "throughput": 333.03, "total_tokens": 13735776} {"current_steps": 10845, "total_steps": 40000, "loss": 0.0577, "lr": 0.24880735859285716, "epoch": 0.5298903085530012, "percentage": 27.11, "elapsed_time": "11:27:27", "remaining_time": "1 day, 6:48:06", "throughput": 333.16, "total_tokens": 13742080} {"current_steps": 10850, "total_steps": 40000, "loss": 0.0592, "lr": 0.24876303143316406, "epoch": 0.5301346102166956, "percentage": 27.12, "elapsed_time": "11:27:30", "remaining_time": "1 day, 6:47:04", "throughput": 333.28, "total_tokens": 13747840} {"current_steps": 10855, "total_steps": 40000, "loss": 0.072, "lr": 0.24871868904297031, "epoch": 0.5303789118803899, "percentage": 27.14, "elapsed_time": "11:27:33", "remaining_time": "1 day, 6:46:02", "throughput": 333.4, "total_tokens": 13753760} {"current_steps": 10860, "total_steps": 40000, "loss": 0.0648, "lr": 0.24867433142911416, "epoch": 0.5306232135440843, "percentage": 27.15, "elapsed_time": "11:27:36", "remaining_time": "1 day, 6:45:01", "throughput": 333.54, "total_tokens": 13760800} {"current_steps": 10865, "total_steps": 40000, "loss": 0.0763, "lr": 0.24862995859843612, "epoch": 0.5308675152077785, "percentage": 27.16, "elapsed_time": "11:27:39", "remaining_time": "1 day, 6:44:00", "throughput": 333.69, "total_tokens": 13768064} {"current_steps": 10870, "total_steps": 40000, "loss": 0.0872, "lr": 0.24858557055777897, "epoch": 0.5311118168714729, "percentage": 27.18, "elapsed_time": "11:27:42", "remaining_time": "1 day, 6:42:58", "throughput": 333.81, "total_tokens": 13773920} {"current_steps": 10875, "total_steps": 40000, "loss": 0.0632, "lr": 0.24854116731398793, "epoch": 0.5313561185351672, "percentage": 27.19, "elapsed_time": "11:27:45", "remaining_time": "1 day, 6:41:56", "throughput": 333.93, "total_tokens": 13780064} {"current_steps": 10880, "total_steps": 40000, "loss": 0.0775, "lr": 0.24849674887391052, "epoch": 0.5316004201988616, "percentage": 27.2, "elapsed_time": "11:27:48", "remaining_time": "1 day, 6:40:54", "throughput": 334.05, "total_tokens": 13785856} {"current_steps": 10885, "total_steps": 40000, "loss": 0.0608, "lr": 0.2484523152443967, "epoch": 0.5318447218625559, "percentage": 27.21, "elapsed_time": "11:27:51", "remaining_time": "1 day, 6:39:53", "throughput": 334.18, "total_tokens": 13792256} {"current_steps": 10890, "total_steps": 40000, "loss": 0.0728, "lr": 0.24840786643229862, "epoch": 0.5320890235262502, "percentage": 27.22, "elapsed_time": "11:27:55", "remaining_time": "1 day, 6:38:52", "throughput": 334.32, "total_tokens": 13798880} {"current_steps": 10895, "total_steps": 40000, "loss": 0.0611, "lr": 0.2483634024444709, "epoch": 0.5323333251899446, "percentage": 27.24, "elapsed_time": "11:27:58", "remaining_time": "1 day, 6:37:50", "throughput": 334.44, "total_tokens": 13805088} {"current_steps": 10900, "total_steps": 40000, "loss": 0.0562, "lr": 0.24831892328777033, "epoch": 0.5325776268536389, "percentage": 27.25, "elapsed_time": "11:28:01", "remaining_time": "1 day, 6:36:49", "throughput": 334.56, "total_tokens": 13811072} {"current_steps": 10905, "total_steps": 40000, "loss": 0.0744, "lr": 0.2482744289690563, "epoch": 0.5328219285173332, "percentage": 27.26, "elapsed_time": "11:28:04", "remaining_time": "1 day, 6:35:47", "throughput": 334.68, "total_tokens": 13817184} {"current_steps": 10910, "total_steps": 40000, "loss": 0.0612, "lr": 0.2482299194951903, "epoch": 0.5330662301810275, "percentage": 27.27, "elapsed_time": "11:28:07", "remaining_time": "1 day, 6:34:46", "throughput": 334.82, "total_tokens": 13823904} {"current_steps": 10915, "total_steps": 40000, "loss": 0.0603, "lr": 0.2481853948730363, "epoch": 0.5333105318447219, "percentage": 27.29, "elapsed_time": "11:28:10", "remaining_time": "1 day, 6:33:46", "throughput": 334.96, "total_tokens": 13830496} {"current_steps": 10920, "total_steps": 40000, "loss": 0.0824, "lr": 0.24814085510946052, "epoch": 0.5335548335084161, "percentage": 27.3, "elapsed_time": "11:28:13", "remaining_time": "1 day, 6:32:44", "throughput": 335.08, "total_tokens": 13836608} {"current_steps": 10925, "total_steps": 40000, "loss": 0.0585, "lr": 0.24809630021133158, "epoch": 0.5337991351721105, "percentage": 27.31, "elapsed_time": "11:28:16", "remaining_time": "1 day, 6:31:43", "throughput": 335.21, "total_tokens": 13843072} {"current_steps": 10930, "total_steps": 40000, "loss": 0.0654, "lr": 0.24805173018552037, "epoch": 0.5340434368358048, "percentage": 27.32, "elapsed_time": "11:28:19", "remaining_time": "1 day, 6:30:42", "throughput": 335.34, "total_tokens": 13849344} {"current_steps": 10935, "total_steps": 40000, "loss": 0.0819, "lr": 0.2480071450389002, "epoch": 0.5342877384994992, "percentage": 27.34, "elapsed_time": "11:28:22", "remaining_time": "1 day, 6:29:42", "throughput": 335.47, "total_tokens": 13855968} {"current_steps": 10940, "total_steps": 40000, "loss": 0.0633, "lr": 0.24796254477834662, "epoch": 0.5345320401631936, "percentage": 27.35, "elapsed_time": "11:28:25", "remaining_time": "1 day, 6:28:41", "throughput": 335.6, "total_tokens": 13862176} {"current_steps": 10945, "total_steps": 40000, "loss": 0.0914, "lr": 0.24791792941073754, "epoch": 0.5347763418268878, "percentage": 27.36, "elapsed_time": "11:28:28", "remaining_time": "1 day, 6:27:40", "throughput": 335.72, "total_tokens": 13868032} {"current_steps": 10950, "total_steps": 40000, "loss": 0.0603, "lr": 0.2478732989429533, "epoch": 0.5350206434905822, "percentage": 27.38, "elapsed_time": "11:28:31", "remaining_time": "1 day, 6:26:39", "throughput": 335.84, "total_tokens": 13874272} {"current_steps": 10955, "total_steps": 40000, "loss": 0.0543, "lr": 0.24782865338187632, "epoch": 0.5352649451542765, "percentage": 27.39, "elapsed_time": "11:28:35", "remaining_time": "1 day, 6:25:38", "throughput": 335.97, "total_tokens": 13880768} {"current_steps": 10960, "total_steps": 40000, "loss": 0.0534, "lr": 0.2477839927343916, "epoch": 0.5355092468179709, "percentage": 27.4, "elapsed_time": "11:28:38", "remaining_time": "1 day, 6:24:37", "throughput": 336.09, "total_tokens": 13886624} {"current_steps": 10965, "total_steps": 40000, "loss": 0.0341, "lr": 0.2477393170073864, "epoch": 0.5357535484816651, "percentage": 27.41, "elapsed_time": "11:28:41", "remaining_time": "1 day, 6:23:37", "throughput": 336.22, "total_tokens": 13892864} {"current_steps": 10970, "total_steps": 40000, "loss": 0.0472, "lr": 0.2476946262077503, "epoch": 0.5359978501453595, "percentage": 27.43, "elapsed_time": "11:28:44", "remaining_time": "1 day, 6:22:37", "throughput": 336.36, "total_tokens": 13899808} {"current_steps": 10975, "total_steps": 40000, "loss": 0.0695, "lr": 0.24764992034237507, "epoch": 0.5362421518090538, "percentage": 27.44, "elapsed_time": "11:28:47", "remaining_time": "1 day, 6:21:36", "throughput": 336.48, "total_tokens": 13906016} {"current_steps": 10980, "total_steps": 40000, "loss": 0.0569, "lr": 0.24760519941815498, "epoch": 0.5364864534727481, "percentage": 27.45, "elapsed_time": "11:28:50", "remaining_time": "1 day, 6:20:36", "throughput": 336.61, "total_tokens": 13912448} {"current_steps": 10985, "total_steps": 40000, "loss": 0.0627, "lr": 0.2475604634419866, "epoch": 0.5367307551364425, "percentage": 27.46, "elapsed_time": "11:28:53", "remaining_time": "1 day, 6:19:35", "throughput": 336.75, "total_tokens": 13918944} {"current_steps": 10990, "total_steps": 40000, "loss": 0.0802, "lr": 0.24751571242076872, "epoch": 0.5369750568001368, "percentage": 27.47, "elapsed_time": "11:28:56", "remaining_time": "1 day, 6:18:35", "throughput": 336.87, "total_tokens": 13925184} {"current_steps": 10995, "total_steps": 40000, "loss": 0.0795, "lr": 0.2474709463614025, "epoch": 0.5372193584638312, "percentage": 27.49, "elapsed_time": "11:28:59", "remaining_time": "1 day, 6:17:35", "throughput": 337.0, "total_tokens": 13931424} {"current_steps": 11000, "total_steps": 40000, "loss": 0.0522, "lr": 0.24742616527079145, "epoch": 0.5374636601275254, "percentage": 27.5, "elapsed_time": "11:29:02", "remaining_time": "1 day, 6:16:34", "throughput": 337.12, "total_tokens": 13937504} {"current_steps": 11000, "total_steps": 40000, "eval_loss": 0.06961502879858017, "epoch": 0.5374636601275254, "percentage": 27.5, "elapsed_time": "11:39:42", "remaining_time": "1 day, 6:44:41", "throughput": 331.98, "total_tokens": 13937504} {"current_steps": 11005, "total_steps": 40000, "loss": 0.0488, "lr": 0.24738136915584139, "epoch": 0.5377079617912198, "percentage": 27.51, "elapsed_time": "11:39:46", "remaining_time": "1 day, 6:43:42", "throughput": 332.1, "total_tokens": 13943648} {"current_steps": 11010, "total_steps": 40000, "loss": 0.063, "lr": 0.24733655802346047, "epoch": 0.5379522634549141, "percentage": 27.52, "elapsed_time": "11:39:49", "remaining_time": "1 day, 6:42:40", "throughput": 332.21, "total_tokens": 13949376} {"current_steps": 11015, "total_steps": 40000, "loss": 0.1013, "lr": 0.24729173188055906, "epoch": 0.5381965651186085, "percentage": 27.54, "elapsed_time": "11:39:52", "remaining_time": "1 day, 6:41:39", "throughput": 332.34, "total_tokens": 13955680} {"current_steps": 11020, "total_steps": 40000, "loss": 0.062, "lr": 0.24724689073404996, "epoch": 0.5384408667823027, "percentage": 27.55, "elapsed_time": "11:39:55", "remaining_time": "1 day, 6:40:38", "throughput": 332.46, "total_tokens": 13962048} {"current_steps": 11025, "total_steps": 40000, "loss": 0.1021, "lr": 0.24720203459084822, "epoch": 0.5386851684459971, "percentage": 27.56, "elapsed_time": "11:39:58", "remaining_time": "1 day, 6:39:37", "throughput": 332.58, "total_tokens": 13967808} {"current_steps": 11030, "total_steps": 40000, "loss": 0.0723, "lr": 0.24715716345787123, "epoch": 0.5389294701096915, "percentage": 27.57, "elapsed_time": "11:40:01", "remaining_time": "1 day, 6:38:36", "throughput": 332.7, "total_tokens": 13973984} {"current_steps": 11035, "total_steps": 40000, "loss": 0.0552, "lr": 0.2471122773420387, "epoch": 0.5391737717733858, "percentage": 27.59, "elapsed_time": "11:40:04", "remaining_time": "1 day, 6:37:35", "throughput": 332.83, "total_tokens": 13980288} {"current_steps": 11040, "total_steps": 40000, "loss": 0.0604, "lr": 0.24706737625027259, "epoch": 0.5394180734370801, "percentage": 27.6, "elapsed_time": "11:40:07", "remaining_time": "1 day, 6:36:34", "throughput": 332.95, "total_tokens": 13986432} {"current_steps": 11045, "total_steps": 40000, "loss": 0.051, "lr": 0.24702246018949725, "epoch": 0.5396623751007744, "percentage": 27.61, "elapsed_time": "11:40:10", "remaining_time": "1 day, 6:35:33", "throughput": 333.07, "total_tokens": 13992544} {"current_steps": 11050, "total_steps": 40000, "loss": 0.0864, "lr": 0.2469775291666393, "epoch": 0.5399066767644688, "percentage": 27.62, "elapsed_time": "11:40:14", "remaining_time": "1 day, 6:34:32", "throughput": 333.2, "total_tokens": 13999200} {"current_steps": 11055, "total_steps": 40000, "loss": 0.0788, "lr": 0.24693258318862765, "epoch": 0.5401509784281631, "percentage": 27.64, "elapsed_time": "11:40:17", "remaining_time": "1 day, 6:33:32", "throughput": 333.33, "total_tokens": 14005344} {"current_steps": 11060, "total_steps": 40000, "loss": 0.0554, "lr": 0.2468876222623935, "epoch": 0.5403952800918574, "percentage": 27.65, "elapsed_time": "11:40:20", "remaining_time": "1 day, 6:32:31", "throughput": 333.45, "total_tokens": 14011616} {"current_steps": 11065, "total_steps": 40000, "loss": 0.0463, "lr": 0.2468426463948705, "epoch": 0.5406395817555517, "percentage": 27.66, "elapsed_time": "11:40:23", "remaining_time": "1 day, 6:31:30", "throughput": 333.59, "total_tokens": 14018368} {"current_steps": 11070, "total_steps": 40000, "loss": 0.0605, "lr": 0.24679765559299438, "epoch": 0.5408838834192461, "percentage": 27.68, "elapsed_time": "11:40:26", "remaining_time": "1 day, 6:30:30", "throughput": 333.71, "total_tokens": 14024672} {"current_steps": 11075, "total_steps": 40000, "loss": 0.0766, "lr": 0.24675264986370332, "epoch": 0.5411281850829404, "percentage": 27.69, "elapsed_time": "11:40:29", "remaining_time": "1 day, 6:29:29", "throughput": 333.84, "total_tokens": 14031072} {"current_steps": 11080, "total_steps": 40000, "loss": 0.0762, "lr": 0.2467076292139378, "epoch": 0.5413724867466347, "percentage": 27.7, "elapsed_time": "11:40:32", "remaining_time": "1 day, 6:28:29", "throughput": 333.96, "total_tokens": 14037056} {"current_steps": 11085, "total_steps": 40000, "loss": 0.0649, "lr": 0.24666259365064055, "epoch": 0.5416167884103291, "percentage": 27.71, "elapsed_time": "11:40:35", "remaining_time": "1 day, 6:27:28", "throughput": 334.08, "total_tokens": 14043232} {"current_steps": 11090, "total_steps": 40000, "loss": 0.0679, "lr": 0.24661754318075663, "epoch": 0.5418610900740234, "percentage": 27.73, "elapsed_time": "11:40:38", "remaining_time": "1 day, 6:26:28", "throughput": 334.2, "total_tokens": 14049440} {"current_steps": 11095, "total_steps": 40000, "loss": 0.0667, "lr": 0.2465724778112334, "epoch": 0.5421053917377178, "percentage": 27.74, "elapsed_time": "11:40:41", "remaining_time": "1 day, 6:25:28", "throughput": 334.34, "total_tokens": 14056352} {"current_steps": 11100, "total_steps": 40000, "loss": 0.0566, "lr": 0.24652739754902042, "epoch": 0.542349693401412, "percentage": 27.75, "elapsed_time": "11:40:44", "remaining_time": "1 day, 6:24:27", "throughput": 334.47, "total_tokens": 14062784} {"current_steps": 11105, "total_steps": 40000, "loss": 0.066, "lr": 0.24648230240106975, "epoch": 0.5425939950651064, "percentage": 27.76, "elapsed_time": "11:40:47", "remaining_time": "1 day, 6:23:27", "throughput": 334.59, "total_tokens": 14068864} {"current_steps": 11110, "total_steps": 40000, "loss": 0.0466, "lr": 0.2464371923743356, "epoch": 0.5428382967288007, "percentage": 27.77, "elapsed_time": "11:40:50", "remaining_time": "1 day, 6:22:27", "throughput": 334.72, "total_tokens": 14075456} {"current_steps": 11115, "total_steps": 40000, "loss": 0.07, "lr": 0.24639206747577444, "epoch": 0.5430825983924951, "percentage": 27.79, "elapsed_time": "11:40:53", "remaining_time": "1 day, 6:21:27", "throughput": 334.85, "total_tokens": 14081792} {"current_steps": 11120, "total_steps": 40000, "loss": 0.0473, "lr": 0.24634692771234515, "epoch": 0.5433269000561893, "percentage": 27.8, "elapsed_time": "11:40:57", "remaining_time": "1 day, 6:20:27", "throughput": 334.98, "total_tokens": 14088416} {"current_steps": 11125, "total_steps": 40000, "loss": 0.0691, "lr": 0.2463017730910088, "epoch": 0.5435712017198837, "percentage": 27.81, "elapsed_time": "11:41:00", "remaining_time": "1 day, 6:19:27", "throughput": 335.11, "total_tokens": 14094976} {"current_steps": 11130, "total_steps": 40000, "loss": 0.0623, "lr": 0.2462566036187289, "epoch": 0.5438155033835781, "percentage": 27.82, "elapsed_time": "11:41:03", "remaining_time": "1 day, 6:18:27", "throughput": 335.25, "total_tokens": 14101568} {"current_steps": 11135, "total_steps": 40000, "loss": 0.0702, "lr": 0.24621141930247106, "epoch": 0.5440598050472724, "percentage": 27.84, "elapsed_time": "11:41:06", "remaining_time": "1 day, 6:17:27", "throughput": 335.38, "total_tokens": 14108128} {"current_steps": 11140, "total_steps": 40000, "loss": 0.0852, "lr": 0.2461662201492033, "epoch": 0.5443041067109667, "percentage": 27.85, "elapsed_time": "11:41:09", "remaining_time": "1 day, 6:16:28", "throughput": 335.5, "total_tokens": 14114240} {"current_steps": 11145, "total_steps": 40000, "loss": 0.0689, "lr": 0.24612100616589586, "epoch": 0.544548408374661, "percentage": 27.86, "elapsed_time": "11:41:12", "remaining_time": "1 day, 6:15:28", "throughput": 335.62, "total_tokens": 14120512} {"current_steps": 11150, "total_steps": 40000, "loss": 0.0445, "lr": 0.24607577735952135, "epoch": 0.5447927100383554, "percentage": 27.88, "elapsed_time": "11:41:15", "remaining_time": "1 day, 6:14:28", "throughput": 335.75, "total_tokens": 14126720} {"current_steps": 11155, "total_steps": 40000, "loss": 0.0865, "lr": 0.24603053373705464, "epoch": 0.5450370117020497, "percentage": 27.89, "elapsed_time": "11:41:18", "remaining_time": "1 day, 6:13:28", "throughput": 335.87, "total_tokens": 14132832} {"current_steps": 11160, "total_steps": 40000, "loss": 0.0631, "lr": 0.2459852753054728, "epoch": 0.545281313365744, "percentage": 27.9, "elapsed_time": "11:41:21", "remaining_time": "1 day, 6:12:28", "throughput": 335.99, "total_tokens": 14139136} {"current_steps": 11165, "total_steps": 40000, "loss": 0.0878, "lr": 0.24594000207175526, "epoch": 0.5455256150294383, "percentage": 27.91, "elapsed_time": "11:41:24", "remaining_time": "1 day, 6:11:29", "throughput": 336.12, "total_tokens": 14145600} {"current_steps": 11170, "total_steps": 40000, "loss": 0.0706, "lr": 0.2458947140428838, "epoch": 0.5457699166931327, "percentage": 27.93, "elapsed_time": "11:41:27", "remaining_time": "1 day, 6:10:29", "throughput": 336.25, "total_tokens": 14151968} {"current_steps": 11175, "total_steps": 40000, "loss": 0.0809, "lr": 0.24584941122584233, "epoch": 0.5460142183568271, "percentage": 27.94, "elapsed_time": "11:41:31", "remaining_time": "1 day, 6:09:30", "throughput": 336.37, "total_tokens": 14158240} {"current_steps": 11180, "total_steps": 40000, "loss": 0.0582, "lr": 0.24580409362761713, "epoch": 0.5462585200205213, "percentage": 27.95, "elapsed_time": "11:41:34", "remaining_time": "1 day, 6:08:31", "throughput": 336.5, "total_tokens": 14164864} {"current_steps": 11185, "total_steps": 40000, "loss": 0.0824, "lr": 0.2457587612551967, "epoch": 0.5465028216842157, "percentage": 27.96, "elapsed_time": "11:41:37", "remaining_time": "1 day, 6:07:31", "throughput": 336.63, "total_tokens": 14171008} {"current_steps": 11190, "total_steps": 40000, "loss": 0.091, "lr": 0.24571341411557193, "epoch": 0.54674712334791, "percentage": 27.98, "elapsed_time": "11:41:40", "remaining_time": "1 day, 6:06:32", "throughput": 336.75, "total_tokens": 14177216} {"current_steps": 11195, "total_steps": 40000, "loss": 0.0862, "lr": 0.2456680522157359, "epoch": 0.5469914250116044, "percentage": 27.99, "elapsed_time": "11:41:43", "remaining_time": "1 day, 6:05:33", "throughput": 336.88, "total_tokens": 14183712} {"current_steps": 11200, "total_steps": 40000, "loss": 0.0684, "lr": 0.245622675562684, "epoch": 0.5472357266752986, "percentage": 28.0, "elapsed_time": "11:41:46", "remaining_time": "1 day, 6:04:33", "throughput": 337.01, "total_tokens": 14190304} {"current_steps": 11200, "total_steps": 40000, "eval_loss": 0.0725501999258995, "epoch": 0.5472357266752986, "percentage": 28.0, "elapsed_time": "11:52:25", "remaining_time": "1 day, 6:31:56", "throughput": 331.97, "total_tokens": 14190304} {"current_steps": 11205, "total_steps": 40000, "loss": 0.0655, "lr": 0.24557728416341384, "epoch": 0.547480028338993, "percentage": 28.01, "elapsed_time": "11:52:29", "remaining_time": "1 day, 6:30:59", "throughput": 332.09, "total_tokens": 14196960} {"current_steps": 11210, "total_steps": 40000, "loss": 0.0613, "lr": 0.24553187802492538, "epoch": 0.5477243300026873, "percentage": 28.02, "elapsed_time": "11:52:32", "remaining_time": "1 day, 6:29:59", "throughput": 332.22, "total_tokens": 14203360} {"current_steps": 11215, "total_steps": 40000, "loss": 0.0464, "lr": 0.24548645715422074, "epoch": 0.5479686316663817, "percentage": 28.04, "elapsed_time": "11:52:36", "remaining_time": "1 day, 6:28:59", "throughput": 332.36, "total_tokens": 14210240} {"current_steps": 11220, "total_steps": 40000, "loss": 0.0559, "lr": 0.2454410215583045, "epoch": 0.5482129333300759, "percentage": 28.05, "elapsed_time": "11:52:39", "remaining_time": "1 day, 6:28:00", "throughput": 332.48, "total_tokens": 14216736} {"current_steps": 11225, "total_steps": 40000, "loss": 0.0485, "lr": 0.24539557124418332, "epoch": 0.5484572349937703, "percentage": 28.06, "elapsed_time": "11:52:42", "remaining_time": "1 day, 6:26:59", "throughput": 332.6, "total_tokens": 14222784} {"current_steps": 11230, "total_steps": 40000, "loss": 0.1009, "lr": 0.24535010621886624, "epoch": 0.5487015366574647, "percentage": 28.07, "elapsed_time": "11:52:45", "remaining_time": "1 day, 6:25:59", "throughput": 332.72, "total_tokens": 14228896} {"current_steps": 11235, "total_steps": 40000, "loss": 0.0692, "lr": 0.2453046264893646, "epoch": 0.548945838321159, "percentage": 28.09, "elapsed_time": "11:52:48", "remaining_time": "1 day, 6:24:59", "throughput": 332.85, "total_tokens": 14235360} {"current_steps": 11240, "total_steps": 40000, "loss": 0.0655, "lr": 0.24525913206269184, "epoch": 0.5491901399848533, "percentage": 28.1, "elapsed_time": "11:52:51", "remaining_time": "1 day, 6:24:00", "throughput": 332.97, "total_tokens": 14241568} {"current_steps": 11245, "total_steps": 40000, "loss": 0.1048, "lr": 0.2452136229458638, "epoch": 0.5494344416485476, "percentage": 28.11, "elapsed_time": "11:52:54", "remaining_time": "1 day, 6:23:00", "throughput": 333.09, "total_tokens": 14247712} {"current_steps": 11250, "total_steps": 40000, "loss": 0.0649, "lr": 0.24516809914589857, "epoch": 0.549678743312242, "percentage": 28.12, "elapsed_time": "11:52:57", "remaining_time": "1 day, 6:22:00", "throughput": 333.21, "total_tokens": 14253824} {"current_steps": 11255, "total_steps": 40000, "loss": 0.0867, "lr": 0.2451225606698165, "epoch": 0.5499230449759362, "percentage": 28.14, "elapsed_time": "11:53:00", "remaining_time": "1 day, 6:21:00", "throughput": 333.33, "total_tokens": 14259840} {"current_steps": 11260, "total_steps": 40000, "loss": 0.0657, "lr": 0.2450770075246402, "epoch": 0.5501673466396306, "percentage": 28.15, "elapsed_time": "11:53:03", "remaining_time": "1 day, 6:20:01", "throughput": 333.46, "total_tokens": 14266656} {"current_steps": 11265, "total_steps": 40000, "loss": 0.0652, "lr": 0.24503143971739455, "epoch": 0.5504116483033249, "percentage": 28.16, "elapsed_time": "11:53:06", "remaining_time": "1 day, 6:19:01", "throughput": 333.58, "total_tokens": 14272736} {"current_steps": 11270, "total_steps": 40000, "loss": 0.0478, "lr": 0.24498585725510663, "epoch": 0.5506559499670193, "percentage": 28.18, "elapsed_time": "11:53:09", "remaining_time": "1 day, 6:18:01", "throughput": 333.71, "total_tokens": 14279360} {"current_steps": 11275, "total_steps": 40000, "loss": 0.0783, "lr": 0.24494026014480583, "epoch": 0.5509002516307137, "percentage": 28.19, "elapsed_time": "11:53:12", "remaining_time": "1 day, 6:17:02", "throughput": 333.83, "total_tokens": 14285408} {"current_steps": 11280, "total_steps": 40000, "loss": 0.0489, "lr": 0.24489464839352387, "epoch": 0.5511445532944079, "percentage": 28.2, "elapsed_time": "11:53:15", "remaining_time": "1 day, 6:16:02", "throughput": 333.94, "total_tokens": 14291296} {"current_steps": 11285, "total_steps": 40000, "loss": 0.0666, "lr": 0.2448490220082946, "epoch": 0.5513888549581023, "percentage": 28.21, "elapsed_time": "11:53:19", "remaining_time": "1 day, 6:15:03", "throughput": 334.08, "total_tokens": 14298496} {"current_steps": 11290, "total_steps": 40000, "loss": 0.0866, "lr": 0.24480338099615415, "epoch": 0.5516331566217966, "percentage": 28.23, "elapsed_time": "11:53:22", "remaining_time": "1 day, 6:14:04", "throughput": 334.21, "total_tokens": 14305024} {"current_steps": 11295, "total_steps": 40000, "loss": 0.069, "lr": 0.244757725364141, "epoch": 0.551877458285491, "percentage": 28.24, "elapsed_time": "11:53:25", "remaining_time": "1 day, 6:13:04", "throughput": 334.33, "total_tokens": 14311264} {"current_steps": 11300, "total_steps": 40000, "loss": 0.0343, "lr": 0.24471205511929583, "epoch": 0.5521217599491852, "percentage": 28.25, "elapsed_time": "11:53:28", "remaining_time": "1 day, 6:12:05", "throughput": 334.46, "total_tokens": 14317888} {"current_steps": 11305, "total_steps": 40000, "loss": 0.0823, "lr": 0.24466637026866145, "epoch": 0.5523660616128796, "percentage": 28.26, "elapsed_time": "11:53:31", "remaining_time": "1 day, 6:11:06", "throughput": 334.58, "total_tokens": 14324000} {"current_steps": 11310, "total_steps": 40000, "loss": 0.0475, "lr": 0.2446206708192832, "epoch": 0.5526103632765739, "percentage": 28.27, "elapsed_time": "11:53:34", "remaining_time": "1 day, 6:10:07", "throughput": 334.71, "total_tokens": 14330592} {"current_steps": 11315, "total_steps": 40000, "loss": 0.0384, "lr": 0.2445749567782084, "epoch": 0.5528546649402682, "percentage": 28.29, "elapsed_time": "11:53:37", "remaining_time": "1 day, 6:09:08", "throughput": 334.84, "total_tokens": 14336864} {"current_steps": 11320, "total_steps": 40000, "loss": 0.0752, "lr": 0.2445292281524868, "epoch": 0.5530989666039626, "percentage": 28.3, "elapsed_time": "11:53:40", "remaining_time": "1 day, 6:08:09", "throughput": 334.96, "total_tokens": 14343104} {"current_steps": 11325, "total_steps": 40000, "loss": 0.0744, "lr": 0.24448348494917022, "epoch": 0.5533432682676569, "percentage": 28.31, "elapsed_time": "11:53:43", "remaining_time": "1 day, 6:07:10", "throughput": 335.09, "total_tokens": 14349696} {"current_steps": 11330, "total_steps": 40000, "loss": 0.079, "lr": 0.24443772717531295, "epoch": 0.5535875699313513, "percentage": 28.32, "elapsed_time": "11:53:46", "remaining_time": "1 day, 6:06:11", "throughput": 335.21, "total_tokens": 14356064} {"current_steps": 11335, "total_steps": 40000, "loss": 0.0604, "lr": 0.24439195483797138, "epoch": 0.5538318715950455, "percentage": 28.34, "elapsed_time": "11:53:49", "remaining_time": "1 day, 6:05:12", "throughput": 335.34, "total_tokens": 14362432} {"current_steps": 11340, "total_steps": 40000, "loss": 0.0842, "lr": 0.24434616794420416, "epoch": 0.5540761732587399, "percentage": 28.35, "elapsed_time": "11:53:53", "remaining_time": "1 day, 6:04:13", "throughput": 335.47, "total_tokens": 14369056} {"current_steps": 11345, "total_steps": 40000, "loss": 0.0743, "lr": 0.24430036650107223, "epoch": 0.5543204749224342, "percentage": 28.36, "elapsed_time": "11:53:56", "remaining_time": "1 day, 6:03:15", "throughput": 335.6, "total_tokens": 14375840} {"current_steps": 11350, "total_steps": 40000, "loss": 0.0512, "lr": 0.2442545505156387, "epoch": 0.5545647765861286, "percentage": 28.38, "elapsed_time": "11:53:59", "remaining_time": "1 day, 6:02:16", "throughput": 335.73, "total_tokens": 14382496} {"current_steps": 11355, "total_steps": 40000, "loss": 0.0556, "lr": 0.24420871999496904, "epoch": 0.5548090782498228, "percentage": 28.39, "elapsed_time": "11:54:02", "remaining_time": "1 day, 6:01:17", "throughput": 335.85, "total_tokens": 14388832} {"current_steps": 11360, "total_steps": 40000, "loss": 0.0818, "lr": 0.24416287494613084, "epoch": 0.5550533799135172, "percentage": 28.4, "elapsed_time": "11:54:05", "remaining_time": "1 day, 6:00:19", "throughput": 335.98, "total_tokens": 14395104} {"current_steps": 11365, "total_steps": 40000, "loss": 0.0859, "lr": 0.24411701537619399, "epoch": 0.5552976815772115, "percentage": 28.41, "elapsed_time": "11:54:08", "remaining_time": "1 day, 5:59:20", "throughput": 336.1, "total_tokens": 14401472} {"current_steps": 11370, "total_steps": 40000, "loss": 0.0523, "lr": 0.24407114129223062, "epoch": 0.5555419832409059, "percentage": 28.43, "elapsed_time": "11:54:11", "remaining_time": "1 day, 5:58:21", "throughput": 336.21, "total_tokens": 14407360} {"current_steps": 11375, "total_steps": 40000, "loss": 0.0782, "lr": 0.2440252527013151, "epoch": 0.5557862849046002, "percentage": 28.44, "elapsed_time": "11:54:14", "remaining_time": "1 day, 5:57:23", "throughput": 336.34, "total_tokens": 14413568} {"current_steps": 11380, "total_steps": 40000, "loss": 0.0625, "lr": 0.24397934961052403, "epoch": 0.5560305865682945, "percentage": 28.45, "elapsed_time": "11:54:17", "remaining_time": "1 day, 5:56:24", "throughput": 336.46, "total_tokens": 14419776} {"current_steps": 11385, "total_steps": 40000, "loss": 0.0425, "lr": 0.24393343202693618, "epoch": 0.5562748882319889, "percentage": 28.46, "elapsed_time": "11:54:20", "remaining_time": "1 day, 5:55:26", "throughput": 336.59, "total_tokens": 14426368} {"current_steps": 11390, "total_steps": 40000, "loss": 0.027, "lr": 0.2438874999576327, "epoch": 0.5565191898956832, "percentage": 28.48, "elapsed_time": "11:54:23", "remaining_time": "1 day, 5:54:27", "throughput": 336.71, "total_tokens": 14432480} {"current_steps": 11395, "total_steps": 40000, "loss": 0.0479, "lr": 0.24384155340969688, "epoch": 0.5567634915593775, "percentage": 28.49, "elapsed_time": "11:54:26", "remaining_time": "1 day, 5:53:29", "throughput": 336.83, "total_tokens": 14438976} {"current_steps": 11400, "total_steps": 40000, "loss": 0.0817, "lr": 0.24379559239021423, "epoch": 0.5570077932230718, "percentage": 28.5, "elapsed_time": "11:54:29", "remaining_time": "1 day, 5:52:31", "throughput": 336.96, "total_tokens": 14445312} {"current_steps": 11400, "total_steps": 40000, "eval_loss": 0.07307746261358261, "epoch": 0.5570077932230718, "percentage": 28.5, "elapsed_time": "12:05:10", "remaining_time": "1 day, 6:19:18", "throughput": 331.99, "total_tokens": 14445312} {"current_steps": 11405, "total_steps": 40000, "loss": 0.09, "lr": 0.2437496169062725, "epoch": 0.5572520948867662, "percentage": 28.51, "elapsed_time": "12:05:14", "remaining_time": "1 day, 6:18:21", "throughput": 332.11, "total_tokens": 14451744} {"current_steps": 11410, "total_steps": 40000, "loss": 0.0647, "lr": 0.24370362696496176, "epoch": 0.5574963965504605, "percentage": 28.52, "elapsed_time": "12:05:17", "remaining_time": "1 day, 6:17:22", "throughput": 332.23, "total_tokens": 14457984} {"current_steps": 11415, "total_steps": 40000, "loss": 0.0697, "lr": 0.24365762257337417, "epoch": 0.5577406982141548, "percentage": 28.54, "elapsed_time": "12:05:20", "remaining_time": "1 day, 6:16:23", "throughput": 332.35, "total_tokens": 14464000} {"current_steps": 11420, "total_steps": 40000, "loss": 0.0771, "lr": 0.2436116037386042, "epoch": 0.5579849998778492, "percentage": 28.55, "elapsed_time": "12:05:23", "remaining_time": "1 day, 6:15:24", "throughput": 332.46, "total_tokens": 14470144} {"current_steps": 11425, "total_steps": 40000, "loss": 0.0754, "lr": 0.24356557046774852, "epoch": 0.5582293015415435, "percentage": 28.56, "elapsed_time": "12:05:27", "remaining_time": "1 day, 6:14:25", "throughput": 332.59, "total_tokens": 14476704} {"current_steps": 11430, "total_steps": 40000, "loss": 0.0691, "lr": 0.24351952276790606, "epoch": 0.5584736032052379, "percentage": 28.57, "elapsed_time": "12:05:30", "remaining_time": "1 day, 6:13:26", "throughput": 332.72, "total_tokens": 14483232} {"current_steps": 11435, "total_steps": 40000, "loss": 0.0371, "lr": 0.24347346064617797, "epoch": 0.5587179048689321, "percentage": 28.59, "elapsed_time": "12:05:33", "remaining_time": "1 day, 6:12:27", "throughput": 332.85, "total_tokens": 14490048} {"current_steps": 11440, "total_steps": 40000, "loss": 0.053, "lr": 0.24342738410966758, "epoch": 0.5589622065326265, "percentage": 28.6, "elapsed_time": "12:05:36", "remaining_time": "1 day, 6:11:28", "throughput": 332.97, "total_tokens": 14496288} {"current_steps": 11445, "total_steps": 40000, "loss": 0.0689, "lr": 0.24338129316548046, "epoch": 0.5592065081963208, "percentage": 28.61, "elapsed_time": "12:05:39", "remaining_time": "1 day, 6:10:30", "throughput": 333.09, "total_tokens": 14502656} {"current_steps": 11450, "total_steps": 40000, "loss": 0.0493, "lr": 0.24333518782072444, "epoch": 0.5594508098600152, "percentage": 28.62, "elapsed_time": "12:05:42", "remaining_time": "1 day, 6:09:31", "throughput": 333.22, "total_tokens": 14509440} {"current_steps": 11455, "total_steps": 40000, "loss": 0.0787, "lr": 0.24328906808250952, "epoch": 0.5596951115237094, "percentage": 28.64, "elapsed_time": "12:05:45", "remaining_time": "1 day, 6:08:32", "throughput": 333.34, "total_tokens": 14515328} {"current_steps": 11460, "total_steps": 40000, "loss": 0.0704, "lr": 0.243242933957948, "epoch": 0.5599394131874038, "percentage": 28.65, "elapsed_time": "12:05:48", "remaining_time": "1 day, 6:07:33", "throughput": 333.46, "total_tokens": 14521888} {"current_steps": 11465, "total_steps": 40000, "loss": 0.1072, "lr": 0.24319678545415427, "epoch": 0.5601837148510982, "percentage": 28.66, "elapsed_time": "12:05:51", "remaining_time": "1 day, 6:06:35", "throughput": 333.59, "total_tokens": 14528288} {"current_steps": 11470, "total_steps": 40000, "loss": 0.0568, "lr": 0.24315062257824507, "epoch": 0.5604280165147925, "percentage": 28.68, "elapsed_time": "12:05:54", "remaining_time": "1 day, 6:05:36", "throughput": 333.7, "total_tokens": 14534176} {"current_steps": 11475, "total_steps": 40000, "loss": 0.0696, "lr": 0.24310444533733921, "epoch": 0.5606723181784868, "percentage": 28.69, "elapsed_time": "12:05:57", "remaining_time": "1 day, 6:04:37", "throughput": 333.81, "total_tokens": 14540224} {"current_steps": 11480, "total_steps": 40000, "loss": 0.0649, "lr": 0.2430582537385579, "epoch": 0.5609166198421811, "percentage": 28.7, "elapsed_time": "12:06:01", "remaining_time": "1 day, 6:03:39", "throughput": 333.94, "total_tokens": 14546656} {"current_steps": 11485, "total_steps": 40000, "loss": 0.0581, "lr": 0.2430120477890244, "epoch": 0.5611609215058755, "percentage": 28.71, "elapsed_time": "12:06:04", "remaining_time": "1 day, 6:02:40", "throughput": 334.05, "total_tokens": 14552672} {"current_steps": 11490, "total_steps": 40000, "loss": 0.0532, "lr": 0.24296582749586426, "epoch": 0.5614052231695698, "percentage": 28.73, "elapsed_time": "12:06:07", "remaining_time": "1 day, 6:01:42", "throughput": 334.17, "total_tokens": 14558592} {"current_steps": 11495, "total_steps": 40000, "loss": 0.0765, "lr": 0.24291959286620526, "epoch": 0.5616495248332641, "percentage": 28.74, "elapsed_time": "12:06:10", "remaining_time": "1 day, 6:00:44", "throughput": 334.28, "total_tokens": 14564832} {"current_steps": 11500, "total_steps": 40000, "loss": 0.0713, "lr": 0.24287334390717738, "epoch": 0.5618938264969584, "percentage": 28.75, "elapsed_time": "12:06:13", "remaining_time": "1 day, 5:59:45", "throughput": 334.4, "total_tokens": 14571008} {"current_steps": 11505, "total_steps": 40000, "loss": 0.0482, "lr": 0.24282708062591268, "epoch": 0.5621381281606528, "percentage": 28.76, "elapsed_time": "12:06:16", "remaining_time": "1 day, 5:58:47", "throughput": 334.53, "total_tokens": 14577344} {"current_steps": 11510, "total_steps": 40000, "loss": 0.0778, "lr": 0.24278080302954563, "epoch": 0.562382429824347, "percentage": 28.78, "elapsed_time": "12:06:19", "remaining_time": "1 day, 5:57:49", "throughput": 334.64, "total_tokens": 14583424} {"current_steps": 11515, "total_steps": 40000, "loss": 0.0807, "lr": 0.24273451112521283, "epoch": 0.5626267314880414, "percentage": 28.79, "elapsed_time": "12:06:22", "remaining_time": "1 day, 5:56:50", "throughput": 334.76, "total_tokens": 14589696} {"current_steps": 11520, "total_steps": 40000, "loss": 0.0833, "lr": 0.242688204920053, "epoch": 0.5628710331517358, "percentage": 28.8, "elapsed_time": "12:06:25", "remaining_time": "1 day, 5:55:52", "throughput": 334.89, "total_tokens": 14596320} {"current_steps": 11525, "total_steps": 40000, "loss": 0.0603, "lr": 0.24264188442120715, "epoch": 0.5631153348154301, "percentage": 28.81, "elapsed_time": "12:06:28", "remaining_time": "1 day, 5:54:55", "throughput": 335.03, "total_tokens": 14603296} {"current_steps": 11530, "total_steps": 40000, "loss": 0.0542, "lr": 0.24259554963581853, "epoch": 0.5633596364791245, "percentage": 28.82, "elapsed_time": "12:06:31", "remaining_time": "1 day, 5:53:56", "throughput": 335.14, "total_tokens": 14609216} {"current_steps": 11535, "total_steps": 40000, "loss": 0.0885, "lr": 0.24254920057103257, "epoch": 0.5636039381428187, "percentage": 28.84, "elapsed_time": "12:06:34", "remaining_time": "1 day, 5:52:59", "throughput": 335.26, "total_tokens": 14615584} {"current_steps": 11540, "total_steps": 40000, "loss": 0.0611, "lr": 0.24250283723399685, "epoch": 0.5638482398065131, "percentage": 28.85, "elapsed_time": "12:06:37", "remaining_time": "1 day, 5:52:01", "throughput": 335.38, "total_tokens": 14622048} {"current_steps": 11545, "total_steps": 40000, "loss": 0.0771, "lr": 0.24245645963186108, "epoch": 0.5640925414702074, "percentage": 28.86, "elapsed_time": "12:06:41", "remaining_time": "1 day, 5:51:03", "throughput": 335.51, "total_tokens": 14628544} {"current_steps": 11550, "total_steps": 40000, "loss": 0.0459, "lr": 0.2424100677717774, "epoch": 0.5643368431339018, "percentage": 28.88, "elapsed_time": "12:06:44", "remaining_time": "1 day, 5:50:05", "throughput": 335.63, "total_tokens": 14634880} {"current_steps": 11555, "total_steps": 40000, "loss": 0.0531, "lr": 0.24236366166090004, "epoch": 0.564581144797596, "percentage": 28.89, "elapsed_time": "12:06:47", "remaining_time": "1 day, 5:49:07", "throughput": 335.75, "total_tokens": 14641024} {"current_steps": 11560, "total_steps": 40000, "loss": 0.0642, "lr": 0.24231724130638527, "epoch": 0.5648254464612904, "percentage": 28.9, "elapsed_time": "12:06:50", "remaining_time": "1 day, 5:48:09", "throughput": 335.86, "total_tokens": 14647008} {"current_steps": 11565, "total_steps": 40000, "loss": 0.0491, "lr": 0.2422708067153917, "epoch": 0.5650697481249848, "percentage": 28.91, "elapsed_time": "12:06:53", "remaining_time": "1 day, 5:47:12", "throughput": 335.99, "total_tokens": 14653568} {"current_steps": 11570, "total_steps": 40000, "loss": 0.08, "lr": 0.24222435789508026, "epoch": 0.565314049788679, "percentage": 28.93, "elapsed_time": "12:06:56", "remaining_time": "1 day, 5:46:14", "throughput": 336.11, "total_tokens": 14659840} {"current_steps": 11575, "total_steps": 40000, "loss": 0.0882, "lr": 0.24217789485261387, "epoch": 0.5655583514523734, "percentage": 28.94, "elapsed_time": "12:06:59", "remaining_time": "1 day, 5:45:17", "throughput": 336.23, "total_tokens": 14666176} {"current_steps": 11580, "total_steps": 40000, "loss": 0.0438, "lr": 0.2421314175951577, "epoch": 0.5658026531160677, "percentage": 28.95, "elapsed_time": "12:07:02", "remaining_time": "1 day, 5:44:19", "throughput": 336.34, "total_tokens": 14672160} {"current_steps": 11585, "total_steps": 40000, "loss": 0.0976, "lr": 0.2420849261298791, "epoch": 0.5660469547797621, "percentage": 28.96, "elapsed_time": "12:07:05", "remaining_time": "1 day, 5:43:21", "throughput": 336.46, "total_tokens": 14678304} {"current_steps": 11590, "total_steps": 40000, "loss": 0.065, "lr": 0.24203842046394775, "epoch": 0.5662912564434563, "percentage": 28.98, "elapsed_time": "12:07:08", "remaining_time": "1 day, 5:42:24", "throughput": 336.59, "total_tokens": 14684832} {"current_steps": 11595, "total_steps": 40000, "loss": 0.0596, "lr": 0.24199190060453535, "epoch": 0.5665355581071507, "percentage": 28.99, "elapsed_time": "12:07:11", "remaining_time": "1 day, 5:41:27", "throughput": 336.71, "total_tokens": 14691328} {"current_steps": 11600, "total_steps": 40000, "loss": 0.0492, "lr": 0.2419453665588158, "epoch": 0.566779859770845, "percentage": 29.0, "elapsed_time": "12:07:14", "remaining_time": "1 day, 5:40:29", "throughput": 336.83, "total_tokens": 14697344} {"current_steps": 11600, "total_steps": 40000, "eval_loss": 0.07016858458518982, "epoch": 0.566779859770845, "percentage": 29.0, "elapsed_time": "12:17:54", "remaining_time": "1 day, 6:06:37", "throughput": 331.96, "total_tokens": 14697344} {"current_steps": 11605, "total_steps": 40000, "loss": 0.0829, "lr": 0.24189881833396523, "epoch": 0.5670241614345394, "percentage": 29.01, "elapsed_time": "12:17:58", "remaining_time": "1 day, 6:05:41", "throughput": 332.06, "total_tokens": 14703424} {"current_steps": 11610, "total_steps": 40000, "loss": 0.0721, "lr": 0.24185225593716203, "epoch": 0.5672684630982336, "percentage": 29.03, "elapsed_time": "12:18:02", "remaining_time": "1 day, 6:04:43", "throughput": 332.18, "total_tokens": 14709696} {"current_steps": 11615, "total_steps": 40000, "loss": 0.0348, "lr": 0.2418056793755867, "epoch": 0.567512764761928, "percentage": 29.04, "elapsed_time": "12:18:05", "remaining_time": "1 day, 6:03:44", "throughput": 332.3, "total_tokens": 14715936} {"current_steps": 11620, "total_steps": 40000, "loss": 0.0359, "lr": 0.24175908865642187, "epoch": 0.5677570664256224, "percentage": 29.05, "elapsed_time": "12:18:08", "remaining_time": "1 day, 6:02:46", "throughput": 332.42, "total_tokens": 14722272} {"current_steps": 11625, "total_steps": 40000, "loss": 0.0773, "lr": 0.24171248378685248, "epoch": 0.5680013680893167, "percentage": 29.06, "elapsed_time": "12:18:11", "remaining_time": "1 day, 6:01:48", "throughput": 332.54, "total_tokens": 14728416} {"current_steps": 11630, "total_steps": 40000, "loss": 0.0796, "lr": 0.24166586477406554, "epoch": 0.568245669753011, "percentage": 29.07, "elapsed_time": "12:18:14", "remaining_time": "1 day, 6:00:50", "throughput": 332.65, "total_tokens": 14734592} {"current_steps": 11635, "total_steps": 40000, "loss": 0.0471, "lr": 0.24161923162525034, "epoch": 0.5684899714167053, "percentage": 29.09, "elapsed_time": "12:18:17", "remaining_time": "1 day, 5:59:52", "throughput": 332.78, "total_tokens": 14741312} {"current_steps": 11640, "total_steps": 40000, "loss": 0.0629, "lr": 0.2415725843475982, "epoch": 0.5687342730803997, "percentage": 29.1, "elapsed_time": "12:18:20", "remaining_time": "1 day, 5:58:54", "throughput": 332.89, "total_tokens": 14747328} {"current_steps": 11645, "total_steps": 40000, "loss": 0.0796, "lr": 0.24152592294830286, "epoch": 0.568978574744094, "percentage": 29.11, "elapsed_time": "12:18:23", "remaining_time": "1 day, 5:57:56", "throughput": 333.01, "total_tokens": 14753472} {"current_steps": 11650, "total_steps": 40000, "loss": 0.0505, "lr": 0.24147924743455995, "epoch": 0.5692228764077883, "percentage": 29.12, "elapsed_time": "12:18:26", "remaining_time": "1 day, 5:56:59", "throughput": 333.13, "total_tokens": 14760000} {"current_steps": 11655, "total_steps": 40000, "loss": 0.0748, "lr": 0.24143255781356754, "epoch": 0.5694671780714826, "percentage": 29.14, "elapsed_time": "12:18:29", "remaining_time": "1 day, 5:56:01", "throughput": 333.26, "total_tokens": 14766464} {"current_steps": 11660, "total_steps": 40000, "loss": 0.0602, "lr": 0.24138585409252566, "epoch": 0.569711479735177, "percentage": 29.15, "elapsed_time": "12:18:32", "remaining_time": "1 day, 5:55:04", "throughput": 333.39, "total_tokens": 14773536} {"current_steps": 11665, "total_steps": 40000, "loss": 0.0446, "lr": 0.24133913627863662, "epoch": 0.5699557813988714, "percentage": 29.16, "elapsed_time": "12:18:36", "remaining_time": "1 day, 5:54:06", "throughput": 333.51, "total_tokens": 14779840} {"current_steps": 11670, "total_steps": 40000, "loss": 0.0635, "lr": 0.241292404379105, "epoch": 0.5702000830625656, "percentage": 29.18, "elapsed_time": "12:18:39", "remaining_time": "1 day, 5:53:08", "throughput": 333.63, "total_tokens": 14786144} {"current_steps": 11675, "total_steps": 40000, "loss": 0.0596, "lr": 0.24124565840113735, "epoch": 0.57044438472626, "percentage": 29.19, "elapsed_time": "12:18:42", "remaining_time": "1 day, 5:52:11", "throughput": 333.76, "total_tokens": 14793024} {"current_steps": 11680, "total_steps": 40000, "loss": 0.0537, "lr": 0.2411988983519425, "epoch": 0.5706886863899543, "percentage": 29.2, "elapsed_time": "12:18:45", "remaining_time": "1 day, 5:51:13", "throughput": 333.88, "total_tokens": 14799328} {"current_steps": 11685, "total_steps": 40000, "loss": 0.05, "lr": 0.24115212423873145, "epoch": 0.5709329880536487, "percentage": 29.21, "elapsed_time": "12:18:48", "remaining_time": "1 day, 5:50:16", "throughput": 333.99, "total_tokens": 14805408} {"current_steps": 11690, "total_steps": 40000, "loss": 0.0461, "lr": 0.24110533606871737, "epoch": 0.5711772897173429, "percentage": 29.23, "elapsed_time": "12:18:51", "remaining_time": "1 day, 5:49:18", "throughput": 334.11, "total_tokens": 14811456} {"current_steps": 11695, "total_steps": 40000, "loss": 0.0683, "lr": 0.24105853384911552, "epoch": 0.5714215913810373, "percentage": 29.24, "elapsed_time": "12:18:54", "remaining_time": "1 day, 5:48:21", "throughput": 334.23, "total_tokens": 14817920} {"current_steps": 11700, "total_steps": 40000, "loss": 0.0962, "lr": 0.24101171758714346, "epoch": 0.5716658930447316, "percentage": 29.25, "elapsed_time": "12:18:57", "remaining_time": "1 day, 5:47:23", "throughput": 334.35, "total_tokens": 14824096} {"current_steps": 11705, "total_steps": 40000, "loss": 0.1068, "lr": 0.24096488729002086, "epoch": 0.571910194708426, "percentage": 29.26, "elapsed_time": "12:19:00", "remaining_time": "1 day, 5:46:26", "throughput": 334.45, "total_tokens": 14829696} {"current_steps": 11710, "total_steps": 40000, "loss": 0.0695, "lr": 0.24091804296496946, "epoch": 0.5721544963721203, "percentage": 29.28, "elapsed_time": "12:19:03", "remaining_time": "1 day, 5:45:28", "throughput": 334.57, "total_tokens": 14836032} {"current_steps": 11715, "total_steps": 40000, "loss": 0.053, "lr": 0.2408711846192133, "epoch": 0.5723987980358146, "percentage": 29.29, "elapsed_time": "12:19:06", "remaining_time": "1 day, 5:44:31", "throughput": 334.69, "total_tokens": 14842400} {"current_steps": 11720, "total_steps": 40000, "loss": 0.0908, "lr": 0.24082431225997855, "epoch": 0.572643099699509, "percentage": 29.3, "elapsed_time": "12:19:09", "remaining_time": "1 day, 5:43:34", "throughput": 334.82, "total_tokens": 14849056} {"current_steps": 11725, "total_steps": 40000, "loss": 0.0619, "lr": 0.24077742589449344, "epoch": 0.5728874013632033, "percentage": 29.31, "elapsed_time": "12:19:12", "remaining_time": "1 day, 5:42:37", "throughput": 334.94, "total_tokens": 14855392} {"current_steps": 11730, "total_steps": 40000, "loss": 0.0924, "lr": 0.24073052552998844, "epoch": 0.5731317030268976, "percentage": 29.33, "elapsed_time": "12:19:15", "remaining_time": "1 day, 5:41:40", "throughput": 335.05, "total_tokens": 14861440} {"current_steps": 11735, "total_steps": 40000, "loss": 0.0537, "lr": 0.2406836111736963, "epoch": 0.5733760046905919, "percentage": 29.34, "elapsed_time": "12:19:19", "remaining_time": "1 day, 5:40:43", "throughput": 335.17, "total_tokens": 14867776} {"current_steps": 11740, "total_steps": 40000, "loss": 0.078, "lr": 0.2406366828328517, "epoch": 0.5736203063542863, "percentage": 29.35, "elapsed_time": "12:19:22", "remaining_time": "1 day, 5:39:46", "throughput": 335.28, "total_tokens": 14873920} {"current_steps": 11745, "total_steps": 40000, "loss": 0.1012, "lr": 0.2405897405146915, "epoch": 0.5738646080179806, "percentage": 29.36, "elapsed_time": "12:19:25", "remaining_time": "1 day, 5:38:49", "throughput": 335.4, "total_tokens": 14880224} {"current_steps": 11750, "total_steps": 40000, "loss": 0.083, "lr": 0.240542784226455, "epoch": 0.5741089096816749, "percentage": 29.38, "elapsed_time": "12:19:28", "remaining_time": "1 day, 5:37:52", "throughput": 335.53, "total_tokens": 14886976} {"current_steps": 11755, "total_steps": 40000, "loss": 0.0611, "lr": 0.24049581397538328, "epoch": 0.5743532113453692, "percentage": 29.39, "elapsed_time": "12:19:31", "remaining_time": "1 day, 5:36:56", "throughput": 335.65, "total_tokens": 14893280} {"current_steps": 11760, "total_steps": 40000, "loss": 0.079, "lr": 0.24044882976871984, "epoch": 0.5745975130090636, "percentage": 29.4, "elapsed_time": "12:19:34", "remaining_time": "1 day, 5:35:59", "throughput": 335.76, "total_tokens": 14899168} {"current_steps": 11765, "total_steps": 40000, "loss": 0.0832, "lr": 0.2404018316137102, "epoch": 0.574841814672758, "percentage": 29.41, "elapsed_time": "12:19:37", "remaining_time": "1 day, 5:35:02", "throughput": 335.88, "total_tokens": 14905376} {"current_steps": 11770, "total_steps": 40000, "loss": 0.0627, "lr": 0.24035481951760204, "epoch": 0.5750861163364522, "percentage": 29.43, "elapsed_time": "12:19:40", "remaining_time": "1 day, 5:34:05", "throughput": 335.99, "total_tokens": 14911648} {"current_steps": 11775, "total_steps": 40000, "loss": 0.0601, "lr": 0.2403077934876452, "epoch": 0.5753304180001466, "percentage": 29.44, "elapsed_time": "12:19:43", "remaining_time": "1 day, 5:33:08", "throughput": 336.12, "total_tokens": 14918176} {"current_steps": 11780, "total_steps": 40000, "loss": 0.0553, "lr": 0.2402607535310918, "epoch": 0.5755747196638409, "percentage": 29.45, "elapsed_time": "12:19:46", "remaining_time": "1 day, 5:32:11", "throughput": 336.23, "total_tokens": 14924224} {"current_steps": 11785, "total_steps": 40000, "loss": 0.0604, "lr": 0.2402136996551959, "epoch": 0.5758190213275353, "percentage": 29.46, "elapsed_time": "12:19:49", "remaining_time": "1 day, 5:31:15", "throughput": 336.35, "total_tokens": 14930432} {"current_steps": 11790, "total_steps": 40000, "loss": 0.1036, "lr": 0.24016663186721376, "epoch": 0.5760633229912295, "percentage": 29.48, "elapsed_time": "12:19:53", "remaining_time": "1 day, 5:30:19", "throughput": 336.5, "total_tokens": 14938304} {"current_steps": 11795, "total_steps": 40000, "loss": 0.0702, "lr": 0.24011955017440395, "epoch": 0.5763076246549239, "percentage": 29.49, "elapsed_time": "12:19:56", "remaining_time": "1 day, 5:29:23", "throughput": 336.62, "total_tokens": 14944832} {"current_steps": 11800, "total_steps": 40000, "loss": 0.0248, "lr": 0.24007245458402696, "epoch": 0.5765519263186182, "percentage": 29.5, "elapsed_time": "12:19:59", "remaining_time": "1 day, 5:28:26", "throughput": 336.75, "total_tokens": 14951296} {"current_steps": 11800, "total_steps": 40000, "eval_loss": 0.07121576368808746, "epoch": 0.5765519263186182, "percentage": 29.5, "elapsed_time": "12:30:39", "remaining_time": "1 day, 5:53:56", "throughput": 331.96, "total_tokens": 14951296} {"current_steps": 11805, "total_steps": 40000, "loss": 0.0847, "lr": 0.2400253451033456, "epoch": 0.5767962279823126, "percentage": 29.51, "elapsed_time": "12:30:42", "remaining_time": "1 day, 5:53:00", "throughput": 332.07, "total_tokens": 14957312} {"current_steps": 11810, "total_steps": 40000, "loss": 0.0876, "lr": 0.23997822173962463, "epoch": 0.5770405296460069, "percentage": 29.53, "elapsed_time": "12:30:45", "remaining_time": "1 day, 5:52:02", "throughput": 332.18, "total_tokens": 14963520} {"current_steps": 11815, "total_steps": 40000, "loss": 0.0507, "lr": 0.23993108450013118, "epoch": 0.5772848313097012, "percentage": 29.54, "elapsed_time": "12:30:49", "remaining_time": "1 day, 5:51:05", "throughput": 332.31, "total_tokens": 14970176} {"current_steps": 11820, "total_steps": 40000, "loss": 0.097, "lr": 0.2398839333921343, "epoch": 0.5775291329733956, "percentage": 29.55, "elapsed_time": "12:30:52", "remaining_time": "1 day, 5:50:08", "throughput": 332.43, "total_tokens": 14976576} {"current_steps": 11825, "total_steps": 40000, "loss": 0.0742, "lr": 0.23983676842290536, "epoch": 0.5777734346370899, "percentage": 29.56, "elapsed_time": "12:30:55", "remaining_time": "1 day, 5:49:11", "throughput": 332.54, "total_tokens": 14982848} {"current_steps": 11830, "total_steps": 40000, "loss": 0.0305, "lr": 0.2397895895997178, "epoch": 0.5780177363007842, "percentage": 29.58, "elapsed_time": "12:30:58", "remaining_time": "1 day, 5:48:14", "throughput": 332.67, "total_tokens": 14989568} {"current_steps": 11835, "total_steps": 40000, "loss": 0.0766, "lr": 0.23974239692984714, "epoch": 0.5782620379644785, "percentage": 29.59, "elapsed_time": "12:31:01", "remaining_time": "1 day, 5:47:17", "throughput": 332.79, "total_tokens": 14996096} {"current_steps": 11840, "total_steps": 40000, "loss": 0.0546, "lr": 0.2396951904205711, "epoch": 0.5785063396281729, "percentage": 29.6, "elapsed_time": "12:31:04", "remaining_time": "1 day, 5:46:20", "throughput": 332.9, "total_tokens": 15002208} {"current_steps": 11845, "total_steps": 40000, "loss": 0.0555, "lr": 0.23964797007916952, "epoch": 0.5787506412918672, "percentage": 29.61, "elapsed_time": "12:31:07", "remaining_time": "1 day, 5:45:23", "throughput": 333.02, "total_tokens": 15008416} {"current_steps": 11850, "total_steps": 40000, "loss": 0.0826, "lr": 0.23960073591292436, "epoch": 0.5789949429555615, "percentage": 29.62, "elapsed_time": "12:31:10", "remaining_time": "1 day, 5:44:26", "throughput": 333.14, "total_tokens": 15014784} {"current_steps": 11855, "total_steps": 40000, "loss": 0.0833, "lr": 0.2395534879291197, "epoch": 0.5792392446192559, "percentage": 29.64, "elapsed_time": "12:31:13", "remaining_time": "1 day, 5:43:29", "throughput": 333.25, "total_tokens": 15020864} {"current_steps": 11860, "total_steps": 40000, "loss": 0.0743, "lr": 0.23950622613504186, "epoch": 0.5794835462829502, "percentage": 29.65, "elapsed_time": "12:31:16", "remaining_time": "1 day, 5:42:33", "throughput": 333.37, "total_tokens": 15027360} {"current_steps": 11865, "total_steps": 40000, "loss": 0.0716, "lr": 0.2394589505379791, "epoch": 0.5797278479466446, "percentage": 29.66, "elapsed_time": "12:31:20", "remaining_time": "1 day, 5:41:36", "throughput": 333.5, "total_tokens": 15034176} {"current_steps": 11870, "total_steps": 40000, "loss": 0.0647, "lr": 0.23941166114522197, "epoch": 0.5799721496103388, "percentage": 29.68, "elapsed_time": "12:31:23", "remaining_time": "1 day, 5:40:39", "throughput": 333.62, "total_tokens": 15040576} {"current_steps": 11875, "total_steps": 40000, "loss": 0.0727, "lr": 0.23936435796406308, "epoch": 0.5802164512740332, "percentage": 29.69, "elapsed_time": "12:31:26", "remaining_time": "1 day, 5:39:43", "throughput": 333.74, "total_tokens": 15047232} {"current_steps": 11880, "total_steps": 40000, "loss": 0.0744, "lr": 0.23931704100179715, "epoch": 0.5804607529377275, "percentage": 29.7, "elapsed_time": "12:31:29", "remaining_time": "1 day, 5:38:46", "throughput": 333.86, "total_tokens": 15053664} {"current_steps": 11885, "total_steps": 40000, "loss": 0.0556, "lr": 0.2392697102657211, "epoch": 0.5807050546014219, "percentage": 29.71, "elapsed_time": "12:31:32", "remaining_time": "1 day, 5:37:49", "throughput": 333.97, "total_tokens": 15059616} {"current_steps": 11890, "total_steps": 40000, "loss": 0.0636, "lr": 0.23922236576313388, "epoch": 0.5809493562651161, "percentage": 29.73, "elapsed_time": "12:31:35", "remaining_time": "1 day, 5:36:53", "throughput": 334.08, "total_tokens": 15065440} {"current_steps": 11895, "total_steps": 40000, "loss": 0.0718, "lr": 0.2391750075013366, "epoch": 0.5811936579288105, "percentage": 29.74, "elapsed_time": "12:31:38", "remaining_time": "1 day, 5:35:56", "throughput": 334.2, "total_tokens": 15071936} {"current_steps": 11900, "total_steps": 40000, "loss": 0.0482, "lr": 0.2391276354876326, "epoch": 0.5814379595925048, "percentage": 29.75, "elapsed_time": "12:31:41", "remaining_time": "1 day, 5:35:00", "throughput": 334.31, "total_tokens": 15078080} {"current_steps": 11905, "total_steps": 40000, "loss": 0.0505, "lr": 0.23908024972932707, "epoch": 0.5816822612561992, "percentage": 29.76, "elapsed_time": "12:31:44", "remaining_time": "1 day, 5:34:03", "throughput": 334.44, "total_tokens": 15084576} {"current_steps": 11910, "total_steps": 40000, "loss": 0.1184, "lr": 0.2390328502337276, "epoch": 0.5819265629198935, "percentage": 29.78, "elapsed_time": "12:31:47", "remaining_time": "1 day, 5:33:07", "throughput": 334.55, "total_tokens": 15090656} {"current_steps": 11915, "total_steps": 40000, "loss": 0.0528, "lr": 0.23898543700814376, "epoch": 0.5821708645835878, "percentage": 29.79, "elapsed_time": "12:31:50", "remaining_time": "1 day, 5:32:11", "throughput": 334.66, "total_tokens": 15096992} {"current_steps": 11920, "total_steps": 40000, "loss": 0.0862, "lr": 0.2389380100598873, "epoch": 0.5824151662472822, "percentage": 29.8, "elapsed_time": "12:31:53", "remaining_time": "1 day, 5:31:14", "throughput": 334.79, "total_tokens": 15103456} {"current_steps": 11925, "total_steps": 40000, "loss": 0.052, "lr": 0.23889056939627207, "epoch": 0.5826594679109764, "percentage": 29.81, "elapsed_time": "12:31:57", "remaining_time": "1 day, 5:30:19", "throughput": 334.92, "total_tokens": 15110400} {"current_steps": 11930, "total_steps": 40000, "loss": 0.0997, "lr": 0.23884311502461386, "epoch": 0.5829037695746708, "percentage": 29.83, "elapsed_time": "12:32:00", "remaining_time": "1 day, 5:29:22", "throughput": 335.03, "total_tokens": 15116640} {"current_steps": 11935, "total_steps": 40000, "loss": 0.075, "lr": 0.23879564695223088, "epoch": 0.5831480712383651, "percentage": 29.84, "elapsed_time": "12:32:03", "remaining_time": "1 day, 5:28:26", "throughput": 335.14, "total_tokens": 15122592} {"current_steps": 11940, "total_steps": 40000, "loss": 0.0591, "lr": 0.23874816518644332, "epoch": 0.5833923729020595, "percentage": 29.85, "elapsed_time": "12:32:06", "remaining_time": "1 day, 5:27:30", "throughput": 335.25, "total_tokens": 15128480} {"current_steps": 11945, "total_steps": 40000, "loss": 0.0795, "lr": 0.23870066973457335, "epoch": 0.5836366745657537, "percentage": 29.86, "elapsed_time": "12:32:09", "remaining_time": "1 day, 5:26:34", "throughput": 335.37, "total_tokens": 15135040} {"current_steps": 11950, "total_steps": 40000, "loss": 0.0777, "lr": 0.23865316060394545, "epoch": 0.5838809762294481, "percentage": 29.88, "elapsed_time": "12:32:12", "remaining_time": "1 day, 5:25:38", "throughput": 335.49, "total_tokens": 15141600} {"current_steps": 11955, "total_steps": 40000, "loss": 0.097, "lr": 0.2386056378018861, "epoch": 0.5841252778931425, "percentage": 29.89, "elapsed_time": "12:32:15", "remaining_time": "1 day, 5:24:42", "throughput": 335.6, "total_tokens": 15147392} {"current_steps": 11960, "total_steps": 40000, "loss": 0.0676, "lr": 0.2385581013357239, "epoch": 0.5843695795568368, "percentage": 29.9, "elapsed_time": "12:32:18", "remaining_time": "1 day, 5:23:46", "throughput": 335.71, "total_tokens": 15153504} {"current_steps": 11965, "total_steps": 40000, "loss": 0.0716, "lr": 0.23851055121278958, "epoch": 0.5846138812205312, "percentage": 29.91, "elapsed_time": "12:32:21", "remaining_time": "1 day, 5:22:50", "throughput": 335.83, "total_tokens": 15160032} {"current_steps": 11970, "total_steps": 40000, "loss": 0.0501, "lr": 0.23846298744041594, "epoch": 0.5848581828842254, "percentage": 29.93, "elapsed_time": "12:32:24", "remaining_time": "1 day, 5:21:54", "throughput": 335.95, "total_tokens": 15166368} {"current_steps": 11975, "total_steps": 40000, "loss": 0.0752, "lr": 0.23841541002593802, "epoch": 0.5851024845479198, "percentage": 29.94, "elapsed_time": "12:32:27", "remaining_time": "1 day, 5:20:58", "throughput": 336.07, "total_tokens": 15172576} {"current_steps": 11980, "total_steps": 40000, "loss": 0.0585, "lr": 0.23836781897669276, "epoch": 0.5853467862116141, "percentage": 29.95, "elapsed_time": "12:32:30", "remaining_time": "1 day, 5:20:03", "throughput": 336.19, "total_tokens": 15179040} {"current_steps": 11985, "total_steps": 40000, "loss": 0.0765, "lr": 0.23832021430001926, "epoch": 0.5855910878753084, "percentage": 29.96, "elapsed_time": "12:32:33", "remaining_time": "1 day, 5:19:07", "throughput": 336.31, "total_tokens": 15185600} {"current_steps": 11990, "total_steps": 40000, "loss": 0.0626, "lr": 0.2382725960032588, "epoch": 0.5858353895390027, "percentage": 29.98, "elapsed_time": "12:32:37", "remaining_time": "1 day, 5:18:11", "throughput": 336.43, "total_tokens": 15192096} {"current_steps": 11995, "total_steps": 40000, "loss": 0.0809, "lr": 0.23822496409375482, "epoch": 0.5860796912026971, "percentage": 29.99, "elapsed_time": "12:32:40", "remaining_time": "1 day, 5:17:16", "throughput": 336.55, "total_tokens": 15198560} {"current_steps": 12000, "total_steps": 40000, "loss": 0.0542, "lr": 0.2381773185788526, "epoch": 0.5863239928663915, "percentage": 30.0, "elapsed_time": "12:32:43", "remaining_time": "1 day, 5:16:21", "throughput": 336.67, "total_tokens": 15205152} {"current_steps": 12000, "total_steps": 40000, "eval_loss": 0.07154466211795807, "epoch": 0.5863239928663915, "percentage": 30.0, "elapsed_time": "12:43:23", "remaining_time": "1 day, 5:41:14", "throughput": 331.97, "total_tokens": 15205152} {"current_steps": 12005, "total_steps": 40000, "loss": 0.062, "lr": 0.2381296594658998, "epoch": 0.5865682945300857, "percentage": 30.01, "elapsed_time": "12:43:27", "remaining_time": "1 day, 5:40:20", "throughput": 332.08, "total_tokens": 15211840} {"current_steps": 12010, "total_steps": 40000, "loss": 0.0449, "lr": 0.238081986762246, "epoch": 0.5868125961937801, "percentage": 30.03, "elapsed_time": "12:43:30", "remaining_time": "1 day, 5:39:24", "throughput": 332.2, "total_tokens": 15218272} {"current_steps": 12015, "total_steps": 40000, "loss": 0.0969, "lr": 0.23803430047524293, "epoch": 0.5870568978574744, "percentage": 30.04, "elapsed_time": "12:43:33", "remaining_time": "1 day, 5:38:28", "throughput": 332.31, "total_tokens": 15224352} {"current_steps": 12020, "total_steps": 40000, "loss": 0.08, "lr": 0.23798660061224441, "epoch": 0.5873011995211688, "percentage": 30.05, "elapsed_time": "12:43:36", "remaining_time": "1 day, 5:37:31", "throughput": 332.43, "total_tokens": 15230688} {"current_steps": 12025, "total_steps": 40000, "loss": 0.0589, "lr": 0.23793888718060632, "epoch": 0.587545501184863, "percentage": 30.06, "elapsed_time": "12:43:39", "remaining_time": "1 day, 5:36:35", "throughput": 332.54, "total_tokens": 15236960} {"current_steps": 12030, "total_steps": 40000, "loss": 0.1068, "lr": 0.23789116018768675, "epoch": 0.5877898028485574, "percentage": 30.08, "elapsed_time": "12:43:42", "remaining_time": "1 day, 5:35:39", "throughput": 332.65, "total_tokens": 15243040} {"current_steps": 12035, "total_steps": 40000, "loss": 0.0655, "lr": 0.2378434196408458, "epoch": 0.5880341045122517, "percentage": 30.09, "elapsed_time": "12:43:46", "remaining_time": "1 day, 5:34:43", "throughput": 332.76, "total_tokens": 15249248} {"current_steps": 12040, "total_steps": 40000, "loss": 0.0635, "lr": 0.23779566554744563, "epoch": 0.5882784061759461, "percentage": 30.1, "elapsed_time": "12:43:49", "remaining_time": "1 day, 5:33:47", "throughput": 332.88, "total_tokens": 15255680} {"current_steps": 12045, "total_steps": 40000, "loss": 0.0606, "lr": 0.23774789791485051, "epoch": 0.5885227078396403, "percentage": 30.11, "elapsed_time": "12:43:52", "remaining_time": "1 day, 5:32:51", "throughput": 333.01, "total_tokens": 15262592} {"current_steps": 12050, "total_steps": 40000, "loss": 0.0756, "lr": 0.2377001167504268, "epoch": 0.5887670095033347, "percentage": 30.12, "elapsed_time": "12:43:55", "remaining_time": "1 day, 5:31:55", "throughput": 333.12, "total_tokens": 15268512} {"current_steps": 12055, "total_steps": 40000, "loss": 0.0624, "lr": 0.23765232206154302, "epoch": 0.5890113111670291, "percentage": 30.14, "elapsed_time": "12:43:58", "remaining_time": "1 day, 5:30:59", "throughput": 333.24, "total_tokens": 15275360} {"current_steps": 12060, "total_steps": 40000, "loss": 0.0363, "lr": 0.23760451385556966, "epoch": 0.5892556128307234, "percentage": 30.15, "elapsed_time": "12:44:01", "remaining_time": "1 day, 5:30:03", "throughput": 333.35, "total_tokens": 15281504} {"current_steps": 12065, "total_steps": 40000, "loss": 0.0491, "lr": 0.23755669213987932, "epoch": 0.5894999144944177, "percentage": 30.16, "elapsed_time": "12:44:04", "remaining_time": "1 day, 5:29:07", "throughput": 333.47, "total_tokens": 15287744} {"current_steps": 12070, "total_steps": 40000, "loss": 0.0874, "lr": 0.23750885692184676, "epoch": 0.589744216158112, "percentage": 30.18, "elapsed_time": "12:44:07", "remaining_time": "1 day, 5:28:11", "throughput": 333.58, "total_tokens": 15293952} {"current_steps": 12075, "total_steps": 40000, "loss": 0.043, "lr": 0.23746100820884875, "epoch": 0.5899885178218064, "percentage": 30.19, "elapsed_time": "12:44:10", "remaining_time": "1 day, 5:27:15", "throughput": 333.69, "total_tokens": 15300096} {"current_steps": 12080, "total_steps": 40000, "loss": 0.0606, "lr": 0.23741314600826421, "epoch": 0.5902328194855007, "percentage": 30.2, "elapsed_time": "12:44:13", "remaining_time": "1 day, 5:26:19", "throughput": 333.8, "total_tokens": 15305984} {"current_steps": 12085, "total_steps": 40000, "loss": 0.1121, "lr": 0.23736527032747406, "epoch": 0.590477121149195, "percentage": 30.21, "elapsed_time": "12:44:16", "remaining_time": "1 day, 5:25:24", "throughput": 333.91, "total_tokens": 15312224} {"current_steps": 12090, "total_steps": 40000, "loss": 0.0476, "lr": 0.23731738117386128, "epoch": 0.5907214228128893, "percentage": 30.23, "elapsed_time": "12:44:19", "remaining_time": "1 day, 5:24:28", "throughput": 334.03, "total_tokens": 15318400} {"current_steps": 12095, "total_steps": 40000, "loss": 0.0737, "lr": 0.237269478554811, "epoch": 0.5909657244765837, "percentage": 30.24, "elapsed_time": "12:44:23", "remaining_time": "1 day, 5:23:32", "throughput": 334.14, "total_tokens": 15324800} {"current_steps": 12100, "total_steps": 40000, "loss": 0.0605, "lr": 0.23722156247771053, "epoch": 0.5912100261402781, "percentage": 30.25, "elapsed_time": "12:44:26", "remaining_time": "1 day, 5:22:37", "throughput": 334.26, "total_tokens": 15331008} {"current_steps": 12105, "total_steps": 40000, "loss": 0.0978, "lr": 0.23717363294994895, "epoch": 0.5914543278039723, "percentage": 30.26, "elapsed_time": "12:44:29", "remaining_time": "1 day, 5:21:41", "throughput": 334.38, "total_tokens": 15337824} {"current_steps": 12110, "total_steps": 40000, "loss": 0.0573, "lr": 0.2371256899789177, "epoch": 0.5916986294676667, "percentage": 30.28, "elapsed_time": "12:44:32", "remaining_time": "1 day, 5:20:46", "throughput": 334.51, "total_tokens": 15344704} {"current_steps": 12115, "total_steps": 40000, "loss": 0.0506, "lr": 0.23707773357201017, "epoch": 0.591942931131361, "percentage": 30.29, "elapsed_time": "12:44:35", "remaining_time": "1 day, 5:19:51", "throughput": 334.62, "total_tokens": 15350976} {"current_steps": 12120, "total_steps": 40000, "loss": 0.0623, "lr": 0.2370297637366218, "epoch": 0.5921872327950554, "percentage": 30.3, "elapsed_time": "12:44:38", "remaining_time": "1 day, 5:18:55", "throughput": 334.74, "total_tokens": 15357472} {"current_steps": 12125, "total_steps": 40000, "loss": 0.0877, "lr": 0.23698178048015026, "epoch": 0.5924315344587496, "percentage": 30.31, "elapsed_time": "12:44:41", "remaining_time": "1 day, 5:18:00", "throughput": 334.85, "total_tokens": 15363296} {"current_steps": 12130, "total_steps": 40000, "loss": 0.0552, "lr": 0.236933783809995, "epoch": 0.592675836122444, "percentage": 30.33, "elapsed_time": "12:44:44", "remaining_time": "1 day, 5:17:04", "throughput": 334.96, "total_tokens": 15369632} {"current_steps": 12135, "total_steps": 40000, "loss": 0.0853, "lr": 0.23688577373355785, "epoch": 0.5929201377861383, "percentage": 30.34, "elapsed_time": "12:44:47", "remaining_time": "1 day, 5:16:09", "throughput": 335.08, "total_tokens": 15375840} {"current_steps": 12140, "total_steps": 40000, "loss": 0.0611, "lr": 0.23683775025824247, "epoch": 0.5931644394498327, "percentage": 30.35, "elapsed_time": "12:44:50", "remaining_time": "1 day, 5:15:14", "throughput": 335.19, "total_tokens": 15381888} {"current_steps": 12145, "total_steps": 40000, "loss": 0.0736, "lr": 0.2367897133914548, "epoch": 0.593408741113527, "percentage": 30.36, "elapsed_time": "12:44:53", "remaining_time": "1 day, 5:14:19", "throughput": 335.3, "total_tokens": 15388000} {"current_steps": 12150, "total_steps": 40000, "loss": 0.1136, "lr": 0.2367416631406026, "epoch": 0.5936530427772213, "percentage": 30.38, "elapsed_time": "12:44:56", "remaining_time": "1 day, 5:13:23", "throughput": 335.41, "total_tokens": 15394080} {"current_steps": 12155, "total_steps": 40000, "loss": 0.0597, "lr": 0.23669359951309588, "epoch": 0.5938973444409157, "percentage": 30.39, "elapsed_time": "12:44:59", "remaining_time": "1 day, 5:12:28", "throughput": 335.52, "total_tokens": 15400096} {"current_steps": 12160, "total_steps": 40000, "loss": 0.0817, "lr": 0.23664552251634666, "epoch": 0.59414164610461, "percentage": 30.4, "elapsed_time": "12:45:02", "remaining_time": "1 day, 5:11:33", "throughput": 335.63, "total_tokens": 15406272} {"current_steps": 12165, "total_steps": 40000, "loss": 0.0755, "lr": 0.23659743215776907, "epoch": 0.5943859477683043, "percentage": 30.41, "elapsed_time": "12:45:05", "remaining_time": "1 day, 5:10:38", "throughput": 335.74, "total_tokens": 15412480} {"current_steps": 12170, "total_steps": 40000, "loss": 0.0451, "lr": 0.23654932844477908, "epoch": 0.5946302494319986, "percentage": 30.43, "elapsed_time": "12:45:09", "remaining_time": "1 day, 5:09:43", "throughput": 335.86, "total_tokens": 15418976} {"current_steps": 12175, "total_steps": 40000, "loss": 0.1028, "lr": 0.23650121138479507, "epoch": 0.594874551095693, "percentage": 30.44, "elapsed_time": "12:45:12", "remaining_time": "1 day, 5:08:48", "throughput": 335.97, "total_tokens": 15425312} {"current_steps": 12180, "total_steps": 40000, "loss": 0.0485, "lr": 0.23645308098523724, "epoch": 0.5951188527593873, "percentage": 30.45, "elapsed_time": "12:45:15", "remaining_time": "1 day, 5:07:53", "throughput": 336.08, "total_tokens": 15431232} {"current_steps": 12185, "total_steps": 40000, "loss": 0.115, "lr": 0.23640493725352785, "epoch": 0.5953631544230816, "percentage": 30.46, "elapsed_time": "12:45:18", "remaining_time": "1 day, 5:06:58", "throughput": 336.2, "total_tokens": 15437920} {"current_steps": 12190, "total_steps": 40000, "loss": 0.045, "lr": 0.2363567801970913, "epoch": 0.5956074560867759, "percentage": 30.48, "elapsed_time": "12:45:21", "remaining_time": "1 day, 5:06:04", "throughput": 336.33, "total_tokens": 15444576} {"current_steps": 12195, "total_steps": 40000, "loss": 0.0842, "lr": 0.236308609823354, "epoch": 0.5958517577504703, "percentage": 30.49, "elapsed_time": "12:45:24", "remaining_time": "1 day, 5:05:09", "throughput": 336.44, "total_tokens": 15450784} {"current_steps": 12200, "total_steps": 40000, "loss": 0.0666, "lr": 0.23626042613974452, "epoch": 0.5960960594141647, "percentage": 30.5, "elapsed_time": "12:45:27", "remaining_time": "1 day, 5:04:15", "throughput": 336.57, "total_tokens": 15457696} {"current_steps": 12200, "total_steps": 40000, "eval_loss": 0.06986404210329056, "epoch": 0.5960960594141647, "percentage": 30.5, "elapsed_time": "12:56:06", "remaining_time": "1 day, 5:28:30", "throughput": 331.95, "total_tokens": 15457696} {"current_steps": 12205, "total_steps": 40000, "loss": 0.0682, "lr": 0.23621222915369325, "epoch": 0.5963403610778589, "percentage": 30.51, "elapsed_time": "12:56:10", "remaining_time": "1 day, 5:27:37", "throughput": 332.06, "total_tokens": 15464384} {"current_steps": 12210, "total_steps": 40000, "loss": 0.1104, "lr": 0.23616401887263283, "epoch": 0.5965846627415533, "percentage": 30.53, "elapsed_time": "12:56:13", "remaining_time": "1 day, 5:26:42", "throughput": 332.17, "total_tokens": 15470624} {"current_steps": 12215, "total_steps": 40000, "loss": 0.0724, "lr": 0.23611579530399793, "epoch": 0.5968289644052476, "percentage": 30.54, "elapsed_time": "12:56:16", "remaining_time": "1 day, 5:25:46", "throughput": 332.29, "total_tokens": 15477120} {"current_steps": 12220, "total_steps": 40000, "loss": 0.0433, "lr": 0.23606755845522517, "epoch": 0.597073266068942, "percentage": 30.55, "elapsed_time": "12:56:20", "remaining_time": "1 day, 5:24:51", "throughput": 332.41, "total_tokens": 15483552} {"current_steps": 12225, "total_steps": 40000, "loss": 0.076, "lr": 0.23601930833375329, "epoch": 0.5973175677326362, "percentage": 30.56, "elapsed_time": "12:56:23", "remaining_time": "1 day, 5:23:56", "throughput": 332.52, "total_tokens": 15489920} {"current_steps": 12230, "total_steps": 40000, "loss": 0.1066, "lr": 0.23597104494702312, "epoch": 0.5975618693963306, "percentage": 30.58, "elapsed_time": "12:56:26", "remaining_time": "1 day, 5:23:00", "throughput": 332.63, "total_tokens": 15496096} {"current_steps": 12235, "total_steps": 40000, "loss": 0.06, "lr": 0.23592276830247744, "epoch": 0.5978061710600249, "percentage": 30.59, "elapsed_time": "12:56:29", "remaining_time": "1 day, 5:22:05", "throughput": 332.75, "total_tokens": 15502528} {"current_steps": 12240, "total_steps": 40000, "loss": 0.0731, "lr": 0.2358744784075611, "epoch": 0.5980504727237193, "percentage": 30.6, "elapsed_time": "12:56:32", "remaining_time": "1 day, 5:21:10", "throughput": 332.87, "total_tokens": 15509216} {"current_steps": 12245, "total_steps": 40000, "loss": 0.083, "lr": 0.235826175269721, "epoch": 0.5982947743874136, "percentage": 30.61, "elapsed_time": "12:56:35", "remaining_time": "1 day, 5:20:15", "throughput": 332.98, "total_tokens": 15515296} {"current_steps": 12250, "total_steps": 40000, "loss": 0.0445, "lr": 0.23577785889640612, "epoch": 0.5985390760511079, "percentage": 30.63, "elapsed_time": "12:56:38", "remaining_time": "1 day, 5:19:20", "throughput": 333.09, "total_tokens": 15521440} {"current_steps": 12255, "total_steps": 40000, "loss": 0.0681, "lr": 0.23572952929506744, "epoch": 0.5987833777148023, "percentage": 30.64, "elapsed_time": "12:56:41", "remaining_time": "1 day, 5:18:25", "throughput": 333.2, "total_tokens": 15527840} {"current_steps": 12260, "total_steps": 40000, "loss": 0.0781, "lr": 0.23568118647315803, "epoch": 0.5990276793784965, "percentage": 30.65, "elapsed_time": "12:56:44", "remaining_time": "1 day, 5:17:29", "throughput": 333.31, "total_tokens": 15533600} {"current_steps": 12265, "total_steps": 40000, "loss": 0.0656, "lr": 0.23563283043813296, "epoch": 0.5992719810421909, "percentage": 30.66, "elapsed_time": "12:56:47", "remaining_time": "1 day, 5:16:34", "throughput": 333.42, "total_tokens": 15540000} {"current_steps": 12270, "total_steps": 40000, "loss": 0.0589, "lr": 0.23558446119744922, "epoch": 0.5995162827058852, "percentage": 30.68, "elapsed_time": "12:56:50", "remaining_time": "1 day, 5:15:39", "throughput": 333.53, "total_tokens": 15546144} {"current_steps": 12275, "total_steps": 40000, "loss": 0.0605, "lr": 0.23553607875856608, "epoch": 0.5997605843695796, "percentage": 30.69, "elapsed_time": "12:56:53", "remaining_time": "1 day, 5:14:44", "throughput": 333.64, "total_tokens": 15552192} {"current_steps": 12280, "total_steps": 40000, "loss": 0.0987, "lr": 0.2354876831289447, "epoch": 0.6000048860332738, "percentage": 30.7, "elapsed_time": "12:56:57", "remaining_time": "1 day, 5:13:49", "throughput": 333.75, "total_tokens": 15558464} {"current_steps": 12285, "total_steps": 40000, "loss": 0.1073, "lr": 0.23543927431604827, "epoch": 0.6002491876969682, "percentage": 30.71, "elapsed_time": "12:57:00", "remaining_time": "1 day, 5:12:55", "throughput": 333.86, "total_tokens": 15564640} {"current_steps": 12290, "total_steps": 40000, "loss": 0.0872, "lr": 0.23539085232734203, "epoch": 0.6004934893606625, "percentage": 30.73, "elapsed_time": "12:57:03", "remaining_time": "1 day, 5:12:00", "throughput": 333.97, "total_tokens": 15570624} {"current_steps": 12295, "total_steps": 40000, "loss": 0.0821, "lr": 0.2353424171702933, "epoch": 0.6007377910243569, "percentage": 30.74, "elapsed_time": "12:57:06", "remaining_time": "1 day, 5:11:05", "throughput": 334.08, "total_tokens": 15577088} {"current_steps": 12300, "total_steps": 40000, "loss": 0.1121, "lr": 0.23529396885237133, "epoch": 0.6009820926880513, "percentage": 30.75, "elapsed_time": "12:57:09", "remaining_time": "1 day, 5:10:10", "throughput": 334.19, "total_tokens": 15583232} {"current_steps": 12305, "total_steps": 40000, "loss": 0.082, "lr": 0.2352455073810475, "epoch": 0.6012263943517455, "percentage": 30.76, "elapsed_time": "12:57:12", "remaining_time": "1 day, 5:09:16", "throughput": 334.32, "total_tokens": 15589952} {"current_steps": 12310, "total_steps": 40000, "loss": 0.0826, "lr": 0.23519703276379517, "epoch": 0.6014706960154399, "percentage": 30.78, "elapsed_time": "12:57:15", "remaining_time": "1 day, 5:08:21", "throughput": 334.43, "total_tokens": 15596160} {"current_steps": 12315, "total_steps": 40000, "loss": 0.0603, "lr": 0.2351485450080897, "epoch": 0.6017149976791342, "percentage": 30.79, "elapsed_time": "12:57:18", "remaining_time": "1 day, 5:07:26", "throughput": 334.54, "total_tokens": 15602272} {"current_steps": 12320, "total_steps": 40000, "loss": 0.0856, "lr": 0.2351000441214086, "epoch": 0.6019592993428285, "percentage": 30.8, "elapsed_time": "12:57:21", "remaining_time": "1 day, 5:06:31", "throughput": 334.65, "total_tokens": 15608384} {"current_steps": 12325, "total_steps": 40000, "loss": 0.0442, "lr": 0.23505153011123125, "epoch": 0.6022036010065228, "percentage": 30.81, "elapsed_time": "12:57:24", "remaining_time": "1 day, 5:05:37", "throughput": 334.77, "total_tokens": 15615360} {"current_steps": 12330, "total_steps": 40000, "loss": 0.0604, "lr": 0.23500300298503912, "epoch": 0.6024479026702172, "percentage": 30.83, "elapsed_time": "12:57:27", "remaining_time": "1 day, 5:04:43", "throughput": 334.89, "total_tokens": 15621856} {"current_steps": 12335, "total_steps": 40000, "loss": 0.0421, "lr": 0.23495446275031576, "epoch": 0.6026922043339115, "percentage": 30.84, "elapsed_time": "12:57:30", "remaining_time": "1 day, 5:03:48", "throughput": 334.99, "total_tokens": 15627776} {"current_steps": 12340, "total_steps": 40000, "loss": 0.052, "lr": 0.2349059094145466, "epoch": 0.6029365059976058, "percentage": 30.85, "elapsed_time": "12:57:34", "remaining_time": "1 day, 5:02:54", "throughput": 335.12, "total_tokens": 15634752} {"current_steps": 12345, "total_steps": 40000, "loss": 0.0649, "lr": 0.2348573429852192, "epoch": 0.6031808076613002, "percentage": 30.86, "elapsed_time": "12:57:37", "remaining_time": "1 day, 5:01:59", "throughput": 335.23, "total_tokens": 15640672} {"current_steps": 12350, "total_steps": 40000, "loss": 0.0801, "lr": 0.23480876346982313, "epoch": 0.6034251093249945, "percentage": 30.88, "elapsed_time": "12:57:40", "remaining_time": "1 day, 5:01:05", "throughput": 335.34, "total_tokens": 15647136} {"current_steps": 12355, "total_steps": 40000, "loss": 0.1117, "lr": 0.23476017087585, "epoch": 0.6036694109886889, "percentage": 30.89, "elapsed_time": "12:57:43", "remaining_time": "1 day, 5:00:11", "throughput": 335.46, "total_tokens": 15653600} {"current_steps": 12360, "total_steps": 40000, "loss": 0.0972, "lr": 0.23471156521079334, "epoch": 0.6039137126523831, "percentage": 30.9, "elapsed_time": "12:57:46", "remaining_time": "1 day, 4:59:17", "throughput": 335.57, "total_tokens": 15659936} {"current_steps": 12365, "total_steps": 40000, "loss": 0.097, "lr": 0.23466294648214875, "epoch": 0.6041580143160775, "percentage": 30.91, "elapsed_time": "12:57:49", "remaining_time": "1 day, 4:58:23", "throughput": 335.7, "total_tokens": 15666976} {"current_steps": 12370, "total_steps": 40000, "loss": 0.0669, "lr": 0.2346143146974139, "epoch": 0.6044023159797718, "percentage": 30.93, "elapsed_time": "12:57:52", "remaining_time": "1 day, 4:57:29", "throughput": 335.81, "total_tokens": 15673088} {"current_steps": 12375, "total_steps": 40000, "loss": 0.0655, "lr": 0.23456566986408836, "epoch": 0.6046466176434662, "percentage": 30.94, "elapsed_time": "12:57:55", "remaining_time": "1 day, 4:56:35", "throughput": 335.92, "total_tokens": 15679296} {"current_steps": 12380, "total_steps": 40000, "loss": 0.0571, "lr": 0.23451701198967384, "epoch": 0.6048909193071604, "percentage": 30.95, "elapsed_time": "12:57:58", "remaining_time": "1 day, 4:55:40", "throughput": 336.03, "total_tokens": 15685216} {"current_steps": 12385, "total_steps": 40000, "loss": 0.0973, "lr": 0.23446834108167397, "epoch": 0.6051352209708548, "percentage": 30.96, "elapsed_time": "12:58:01", "remaining_time": "1 day, 4:54:46", "throughput": 336.14, "total_tokens": 15691424} {"current_steps": 12390, "total_steps": 40000, "loss": 0.0541, "lr": 0.23441965714759438, "epoch": 0.6053795226345492, "percentage": 30.98, "elapsed_time": "12:58:04", "remaining_time": "1 day, 4:53:53", "throughput": 336.25, "total_tokens": 15697760} {"current_steps": 12395, "total_steps": 40000, "loss": 0.0659, "lr": 0.23437096019494277, "epoch": 0.6056238242982435, "percentage": 30.99, "elapsed_time": "12:58:07", "remaining_time": "1 day, 4:52:58", "throughput": 336.36, "total_tokens": 15703904} {"current_steps": 12400, "total_steps": 40000, "loss": 0.0825, "lr": 0.23432225023122885, "epoch": 0.6058681259619378, "percentage": 31.0, "elapsed_time": "12:58:10", "remaining_time": "1 day, 4:52:04", "throughput": 336.47, "total_tokens": 15709984} {"current_steps": 12400, "total_steps": 40000, "eval_loss": 0.06982379406690598, "epoch": 0.6058681259619378, "percentage": 31.0, "elapsed_time": "13:08:50", "remaining_time": "1 day, 5:15:49", "throughput": 331.92, "total_tokens": 15709984} {"current_steps": 12405, "total_steps": 40000, "loss": 0.064, "lr": 0.23427352726396428, "epoch": 0.6061124276256321, "percentage": 31.01, "elapsed_time": "13:08:55", "remaining_time": "1 day, 5:14:58", "throughput": 332.01, "total_tokens": 15716064} {"current_steps": 12410, "total_steps": 40000, "loss": 0.0642, "lr": 0.2342247913006628, "epoch": 0.6063567292893265, "percentage": 31.03, "elapsed_time": "13:08:58", "remaining_time": "1 day, 5:14:04", "throughput": 332.12, "total_tokens": 15722368} {"current_steps": 12415, "total_steps": 40000, "loss": 0.0812, "lr": 0.23417604234883999, "epoch": 0.6066010309530208, "percentage": 31.04, "elapsed_time": "13:09:02", "remaining_time": "1 day, 5:13:09", "throughput": 332.23, "total_tokens": 15728512} {"current_steps": 12420, "total_steps": 40000, "loss": 0.0526, "lr": 0.23412728041601363, "epoch": 0.6068453326167151, "percentage": 31.05, "elapsed_time": "13:09:05", "remaining_time": "1 day, 5:12:15", "throughput": 332.35, "total_tokens": 15735200} {"current_steps": 12425, "total_steps": 40000, "loss": 0.0682, "lr": 0.23407850550970347, "epoch": 0.6070896342804094, "percentage": 31.06, "elapsed_time": "13:09:08", "remaining_time": "1 day, 5:11:20", "throughput": 332.47, "total_tokens": 15741760} {"current_steps": 12430, "total_steps": 40000, "loss": 0.049, "lr": 0.23402971763743116, "epoch": 0.6073339359441038, "percentage": 31.08, "elapsed_time": "13:09:11", "remaining_time": "1 day, 5:10:26", "throughput": 332.58, "total_tokens": 15748032} {"current_steps": 12435, "total_steps": 40000, "loss": 0.0606, "lr": 0.23398091680672037, "epoch": 0.607578237607798, "percentage": 31.09, "elapsed_time": "13:09:14", "remaining_time": "1 day, 5:09:31", "throughput": 332.69, "total_tokens": 15754528} {"current_steps": 12440, "total_steps": 40000, "loss": 0.052, "lr": 0.23393210302509687, "epoch": 0.6078225392714924, "percentage": 31.1, "elapsed_time": "13:09:17", "remaining_time": "1 day, 5:08:37", "throughput": 332.81, "total_tokens": 15760992} {"current_steps": 12445, "total_steps": 40000, "loss": 0.0424, "lr": 0.23388327630008832, "epoch": 0.6080668409351868, "percentage": 31.11, "elapsed_time": "13:09:20", "remaining_time": "1 day, 5:07:43", "throughput": 332.93, "total_tokens": 15767808} {"current_steps": 12450, "total_steps": 40000, "loss": 0.0864, "lr": 0.23383443663922443, "epoch": 0.6083111425988811, "percentage": 31.13, "elapsed_time": "13:09:23", "remaining_time": "1 day, 5:06:49", "throughput": 333.05, "total_tokens": 15774304} {"current_steps": 12455, "total_steps": 40000, "loss": 0.0539, "lr": 0.23378558405003685, "epoch": 0.6085554442625755, "percentage": 31.14, "elapsed_time": "13:09:26", "remaining_time": "1 day, 5:05:54", "throughput": 333.15, "total_tokens": 15780032} {"current_steps": 12460, "total_steps": 40000, "loss": 0.0536, "lr": 0.2337367185400593, "epoch": 0.6087997459262697, "percentage": 31.15, "elapsed_time": "13:09:29", "remaining_time": "1 day, 5:05:00", "throughput": 333.26, "total_tokens": 15786528} {"current_steps": 12465, "total_steps": 40000, "loss": 0.0748, "lr": 0.23368784011682747, "epoch": 0.6090440475899641, "percentage": 31.16, "elapsed_time": "13:09:32", "remaining_time": "1 day, 5:04:05", "throughput": 333.36, "total_tokens": 15792288} {"current_steps": 12470, "total_steps": 40000, "loss": 0.0584, "lr": 0.23363894878787902, "epoch": 0.6092883492536584, "percentage": 31.18, "elapsed_time": "13:09:35", "remaining_time": "1 day, 5:03:11", "throughput": 333.48, "total_tokens": 15798880} {"current_steps": 12475, "total_steps": 40000, "loss": 0.117, "lr": 0.23359004456075352, "epoch": 0.6095326509173528, "percentage": 31.19, "elapsed_time": "13:09:39", "remaining_time": "1 day, 5:02:17", "throughput": 333.59, "total_tokens": 15805376} {"current_steps": 12480, "total_steps": 40000, "loss": 0.0609, "lr": 0.23354112744299277, "epoch": 0.609776952581047, "percentage": 31.2, "elapsed_time": "13:09:42", "remaining_time": "1 day, 5:01:23", "throughput": 333.7, "total_tokens": 15811616} {"current_steps": 12485, "total_steps": 40000, "loss": 0.0556, "lr": 0.2334921974421403, "epoch": 0.6100212542447414, "percentage": 31.21, "elapsed_time": "13:09:45", "remaining_time": "1 day, 5:00:29", "throughput": 333.81, "total_tokens": 15817728} {"current_steps": 12490, "total_steps": 40000, "loss": 0.096, "lr": 0.23344325456574178, "epoch": 0.6102655559084358, "percentage": 31.23, "elapsed_time": "13:09:48", "remaining_time": "1 day, 4:59:35", "throughput": 333.92, "total_tokens": 15824064} {"current_steps": 12495, "total_steps": 40000, "loss": 0.0873, "lr": 0.23339429882134477, "epoch": 0.61050985757213, "percentage": 31.24, "elapsed_time": "13:09:51", "remaining_time": "1 day, 4:58:41", "throughput": 334.03, "total_tokens": 15830240} {"current_steps": 12500, "total_steps": 40000, "loss": 0.0684, "lr": 0.23334533021649884, "epoch": 0.6107541592358244, "percentage": 31.25, "elapsed_time": "13:09:54", "remaining_time": "1 day, 4:57:48", "throughput": 334.16, "total_tokens": 15837376} {"current_steps": 12505, "total_steps": 40000, "loss": 0.0474, "lr": 0.23329634875875566, "epoch": 0.6109984608995187, "percentage": 31.26, "elapsed_time": "13:09:57", "remaining_time": "1 day, 4:56:53", "throughput": 334.26, "total_tokens": 15843232} {"current_steps": 12510, "total_steps": 40000, "loss": 0.0828, "lr": 0.23324735445566874, "epoch": 0.6112427625632131, "percentage": 31.27, "elapsed_time": "13:10:00", "remaining_time": "1 day, 4:56:00", "throughput": 334.38, "total_tokens": 15849760} {"current_steps": 12515, "total_steps": 40000, "loss": 0.0668, "lr": 0.2331983473147936, "epoch": 0.6114870642269074, "percentage": 31.29, "elapsed_time": "13:10:03", "remaining_time": "1 day, 4:55:06", "throughput": 334.5, "total_tokens": 15856416} {"current_steps": 12520, "total_steps": 40000, "loss": 0.0751, "lr": 0.23314932734368776, "epoch": 0.6117313658906017, "percentage": 31.3, "elapsed_time": "13:10:06", "remaining_time": "1 day, 4:54:13", "throughput": 334.61, "total_tokens": 15863072} {"current_steps": 12525, "total_steps": 40000, "loss": 0.0545, "lr": 0.2331002945499107, "epoch": 0.611975667554296, "percentage": 31.31, "elapsed_time": "13:10:10", "remaining_time": "1 day, 4:53:19", "throughput": 334.72, "total_tokens": 15869280} {"current_steps": 12530, "total_steps": 40000, "loss": 0.0803, "lr": 0.23305124894102397, "epoch": 0.6122199692179904, "percentage": 31.32, "elapsed_time": "13:10:13", "remaining_time": "1 day, 4:52:25", "throughput": 334.84, "total_tokens": 15875744} {"current_steps": 12535, "total_steps": 40000, "loss": 0.0778, "lr": 0.23300219052459092, "epoch": 0.6124642708816848, "percentage": 31.34, "elapsed_time": "13:10:16", "remaining_time": "1 day, 4:51:31", "throughput": 334.94, "total_tokens": 15881696} {"current_steps": 12540, "total_steps": 40000, "loss": 0.0854, "lr": 0.23295311930817708, "epoch": 0.612708572545379, "percentage": 31.35, "elapsed_time": "13:10:19", "remaining_time": "1 day, 4:50:38", "throughput": 335.05, "total_tokens": 15888032} {"current_steps": 12545, "total_steps": 40000, "loss": 0.0657, "lr": 0.23290403529934972, "epoch": 0.6129528742090734, "percentage": 31.36, "elapsed_time": "13:10:22", "remaining_time": "1 day, 4:49:44", "throughput": 335.17, "total_tokens": 15894336} {"current_steps": 12550, "total_steps": 40000, "loss": 0.0867, "lr": 0.23285493850567832, "epoch": 0.6131971758727677, "percentage": 31.37, "elapsed_time": "13:10:25", "remaining_time": "1 day, 4:48:51", "throughput": 335.27, "total_tokens": 15900256} {"current_steps": 12555, "total_steps": 40000, "loss": 0.0649, "lr": 0.23280582893473414, "epoch": 0.613441477536462, "percentage": 31.39, "elapsed_time": "13:10:28", "remaining_time": "1 day, 4:47:57", "throughput": 335.38, "total_tokens": 15906560} {"current_steps": 12560, "total_steps": 40000, "loss": 0.0431, "lr": 0.2327567065940906, "epoch": 0.6136857792001563, "percentage": 31.4, "elapsed_time": "13:10:31", "remaining_time": "1 day, 4:47:04", "throughput": 335.5, "total_tokens": 15913120} {"current_steps": 12565, "total_steps": 40000, "loss": 0.0738, "lr": 0.23270757149132285, "epoch": 0.6139300808638507, "percentage": 31.41, "elapsed_time": "13:10:34", "remaining_time": "1 day, 4:46:10", "throughput": 335.61, "total_tokens": 15919392} {"current_steps": 12570, "total_steps": 40000, "loss": 0.0626, "lr": 0.23265842363400827, "epoch": 0.614174382527545, "percentage": 31.42, "elapsed_time": "13:10:37", "remaining_time": "1 day, 4:45:18", "throughput": 335.73, "total_tokens": 15926336} {"current_steps": 12575, "total_steps": 40000, "loss": 0.0734, "lr": 0.23260926302972595, "epoch": 0.6144186841912394, "percentage": 31.44, "elapsed_time": "13:10:40", "remaining_time": "1 day, 4:44:24", "throughput": 335.84, "total_tokens": 15932672} {"current_steps": 12580, "total_steps": 40000, "loss": 0.0511, "lr": 0.2325600896860572, "epoch": 0.6146629858549336, "percentage": 31.45, "elapsed_time": "13:10:44", "remaining_time": "1 day, 4:43:31", "throughput": 335.95, "total_tokens": 15939040} {"current_steps": 12585, "total_steps": 40000, "loss": 0.0612, "lr": 0.23251090361058505, "epoch": 0.614907287518628, "percentage": 31.46, "elapsed_time": "13:10:47", "remaining_time": "1 day, 4:42:38", "throughput": 336.07, "total_tokens": 15945376} {"current_steps": 12590, "total_steps": 40000, "loss": 0.0661, "lr": 0.23246170481089476, "epoch": 0.6151515891823224, "percentage": 31.47, "elapsed_time": "13:10:50", "remaining_time": "1 day, 4:41:45", "throughput": 336.18, "total_tokens": 15951712} {"current_steps": 12595, "total_steps": 40000, "loss": 0.0514, "lr": 0.23241249329457317, "epoch": 0.6153958908460166, "percentage": 31.49, "elapsed_time": "13:10:53", "remaining_time": "1 day, 4:40:51", "throughput": 336.29, "total_tokens": 15958080} {"current_steps": 12600, "total_steps": 40000, "loss": 0.0511, "lr": 0.23236326906920957, "epoch": 0.615640192509711, "percentage": 31.5, "elapsed_time": "13:10:56", "remaining_time": "1 day, 4:39:58", "throughput": 336.4, "total_tokens": 15964384} {"current_steps": 12600, "total_steps": 40000, "eval_loss": 0.07337065786123276, "epoch": 0.615640192509711, "percentage": 31.5, "elapsed_time": "13:21:36", "remaining_time": "1 day, 5:03:10", "throughput": 331.92, "total_tokens": 15964384} {"current_steps": 12605, "total_steps": 40000, "loss": 0.0808, "lr": 0.2323140321423948, "epoch": 0.6158844941734053, "percentage": 31.51, "elapsed_time": "13:21:40", "remaining_time": "1 day, 5:02:18", "throughput": 332.03, "total_tokens": 15970528} {"current_steps": 12610, "total_steps": 40000, "loss": 0.0717, "lr": 0.23226478252172184, "epoch": 0.6161287958370997, "percentage": 31.52, "elapsed_time": "13:21:43", "remaining_time": "1 day, 5:01:24", "throughput": 332.13, "total_tokens": 15976608} {"current_steps": 12615, "total_steps": 40000, "loss": 0.061, "lr": 0.23221552021478561, "epoch": 0.6163730975007939, "percentage": 31.54, "elapsed_time": "13:21:46", "remaining_time": "1 day, 5:00:30", "throughput": 332.24, "total_tokens": 15982976} {"current_steps": 12620, "total_steps": 40000, "loss": 0.0489, "lr": 0.232166245229183, "epoch": 0.6166173991644883, "percentage": 31.55, "elapsed_time": "13:21:49", "remaining_time": "1 day, 4:59:36", "throughput": 332.35, "total_tokens": 15989024} {"current_steps": 12625, "total_steps": 40000, "loss": 0.0611, "lr": 0.2321169575725128, "epoch": 0.6168617008281826, "percentage": 31.56, "elapsed_time": "13:21:52", "remaining_time": "1 day, 4:58:43", "throughput": 332.46, "total_tokens": 15995456} {"current_steps": 12630, "total_steps": 40000, "loss": 0.0936, "lr": 0.23206765725237577, "epoch": 0.617106002491877, "percentage": 31.57, "elapsed_time": "13:21:55", "remaining_time": "1 day, 4:57:49", "throughput": 332.56, "total_tokens": 16001408} {"current_steps": 12635, "total_steps": 40000, "loss": 0.0661, "lr": 0.2320183442763747, "epoch": 0.6173503041555713, "percentage": 31.59, "elapsed_time": "13:21:58", "remaining_time": "1 day, 4:56:55", "throughput": 332.67, "total_tokens": 16007680} {"current_steps": 12640, "total_steps": 40000, "loss": 0.061, "lr": 0.23196901865211422, "epoch": 0.6175946058192656, "percentage": 31.6, "elapsed_time": "13:22:01", "remaining_time": "1 day, 4:56:02", "throughput": 332.8, "total_tokens": 16014784} {"current_steps": 12645, "total_steps": 40000, "loss": 0.0755, "lr": 0.231919680387201, "epoch": 0.61783890748296, "percentage": 31.61, "elapsed_time": "13:22:04", "remaining_time": "1 day, 4:55:08", "throughput": 332.9, "total_tokens": 16020992} {"current_steps": 12650, "total_steps": 40000, "loss": 0.0689, "lr": 0.23187032948924358, "epoch": 0.6180832091466543, "percentage": 31.62, "elapsed_time": "13:22:08", "remaining_time": "1 day, 4:54:15", "throughput": 333.02, "total_tokens": 16027584} {"current_steps": 12655, "total_steps": 40000, "loss": 0.1022, "lr": 0.23182096596585247, "epoch": 0.6183275108103486, "percentage": 31.64, "elapsed_time": "13:22:11", "remaining_time": "1 day, 4:53:22", "throughput": 333.13, "total_tokens": 16034112} {"current_steps": 12660, "total_steps": 40000, "loss": 0.058, "lr": 0.23177158982464025, "epoch": 0.6185718124740429, "percentage": 31.65, "elapsed_time": "13:22:14", "remaining_time": "1 day, 4:52:28", "throughput": 333.25, "total_tokens": 16040672} {"current_steps": 12665, "total_steps": 40000, "loss": 0.0717, "lr": 0.23172220107322122, "epoch": 0.6188161141377373, "percentage": 31.66, "elapsed_time": "13:22:17", "remaining_time": "1 day, 4:51:35", "throughput": 333.35, "total_tokens": 16046784} {"current_steps": 12670, "total_steps": 40000, "loss": 0.0599, "lr": 0.23167279971921184, "epoch": 0.6190604158014316, "percentage": 31.67, "elapsed_time": "13:22:20", "remaining_time": "1 day, 4:50:41", "throughput": 333.46, "total_tokens": 16052640} {"current_steps": 12675, "total_steps": 40000, "loss": 0.0907, "lr": 0.23162338577023034, "epoch": 0.6193047174651259, "percentage": 31.69, "elapsed_time": "13:22:23", "remaining_time": "1 day, 4:49:48", "throughput": 333.57, "total_tokens": 16058976} {"current_steps": 12680, "total_steps": 40000, "loss": 0.0455, "lr": 0.23157395923389704, "epoch": 0.6195490191288203, "percentage": 31.7, "elapsed_time": "13:22:26", "remaining_time": "1 day, 4:48:55", "throughput": 333.68, "total_tokens": 16065536} {"current_steps": 12685, "total_steps": 40000, "loss": 0.0955, "lr": 0.2315245201178341, "epoch": 0.6197933207925146, "percentage": 31.71, "elapsed_time": "13:22:29", "remaining_time": "1 day, 4:48:02", "throughput": 333.79, "total_tokens": 16071744} {"current_steps": 12690, "total_steps": 40000, "loss": 0.0563, "lr": 0.23147506842966564, "epoch": 0.620037622456209, "percentage": 31.72, "elapsed_time": "13:22:32", "remaining_time": "1 day, 4:47:09", "throughput": 333.9, "total_tokens": 16078336} {"current_steps": 12695, "total_steps": 40000, "loss": 0.0463, "lr": 0.23142560417701774, "epoch": 0.6202819241199032, "percentage": 31.74, "elapsed_time": "13:22:35", "remaining_time": "1 day, 4:46:15", "throughput": 334.01, "total_tokens": 16084448} {"current_steps": 12700, "total_steps": 40000, "loss": 0.0691, "lr": 0.23137612736751845, "epoch": 0.6205262257835976, "percentage": 31.75, "elapsed_time": "13:22:38", "remaining_time": "1 day, 4:45:22", "throughput": 334.12, "total_tokens": 16090912} {"current_steps": 12705, "total_steps": 40000, "loss": 0.0615, "lr": 0.23132663800879766, "epoch": 0.6207705274472919, "percentage": 31.76, "elapsed_time": "13:22:41", "remaining_time": "1 day, 4:44:29", "throughput": 334.22, "total_tokens": 16096640} {"current_steps": 12710, "total_steps": 40000, "loss": 0.082, "lr": 0.2312771361084873, "epoch": 0.6210148291109863, "percentage": 31.77, "elapsed_time": "13:22:45", "remaining_time": "1 day, 4:43:36", "throughput": 334.33, "total_tokens": 16103040} {"current_steps": 12715, "total_steps": 40000, "loss": 0.0661, "lr": 0.23122762167422112, "epoch": 0.6212591307746805, "percentage": 31.79, "elapsed_time": "13:22:48", "remaining_time": "1 day, 4:42:43", "throughput": 334.44, "total_tokens": 16109120} {"current_steps": 12720, "total_steps": 40000, "loss": 0.0759, "lr": 0.23117809471363493, "epoch": 0.6215034324383749, "percentage": 31.8, "elapsed_time": "13:22:51", "remaining_time": "1 day, 4:41:50", "throughput": 334.55, "total_tokens": 16115520} {"current_steps": 12725, "total_steps": 40000, "loss": 0.078, "lr": 0.23112855523436637, "epoch": 0.6217477341020692, "percentage": 31.81, "elapsed_time": "13:22:54", "remaining_time": "1 day, 4:40:57", "throughput": 334.65, "total_tokens": 16121312} {"current_steps": 12730, "total_steps": 40000, "loss": 0.0662, "lr": 0.23107900324405511, "epoch": 0.6219920357657636, "percentage": 31.82, "elapsed_time": "13:22:57", "remaining_time": "1 day, 4:40:04", "throughput": 334.76, "total_tokens": 16127616} {"current_steps": 12735, "total_steps": 40000, "loss": 0.0698, "lr": 0.2310294387503426, "epoch": 0.6222363374294579, "percentage": 31.84, "elapsed_time": "13:23:00", "remaining_time": "1 day, 4:39:11", "throughput": 334.87, "total_tokens": 16133984} {"current_steps": 12740, "total_steps": 40000, "loss": 0.0883, "lr": 0.23097986176087237, "epoch": 0.6224806390931522, "percentage": 31.85, "elapsed_time": "13:23:03", "remaining_time": "1 day, 4:38:18", "throughput": 334.98, "total_tokens": 16140288} {"current_steps": 12745, "total_steps": 40000, "loss": 0.0902, "lr": 0.23093027228328986, "epoch": 0.6227249407568466, "percentage": 31.86, "elapsed_time": "13:23:06", "remaining_time": "1 day, 4:37:25", "throughput": 335.08, "total_tokens": 16146240} {"current_steps": 12750, "total_steps": 40000, "loss": 0.0647, "lr": 0.23088067032524226, "epoch": 0.6229692424205409, "percentage": 31.87, "elapsed_time": "13:23:09", "remaining_time": "1 day, 4:36:33", "throughput": 335.19, "total_tokens": 16152512} {"current_steps": 12755, "total_steps": 40000, "loss": 0.1071, "lr": 0.23083105589437888, "epoch": 0.6232135440842352, "percentage": 31.89, "elapsed_time": "13:23:12", "remaining_time": "1 day, 4:35:40", "throughput": 335.3, "total_tokens": 16159168} {"current_steps": 12760, "total_steps": 40000, "loss": 0.0703, "lr": 0.23078142899835094, "epoch": 0.6234578457479295, "percentage": 31.9, "elapsed_time": "13:23:15", "remaining_time": "1 day, 4:34:47", "throughput": 335.41, "total_tokens": 16165472} {"current_steps": 12765, "total_steps": 40000, "loss": 0.08, "lr": 0.23073178964481147, "epoch": 0.6237021474116239, "percentage": 31.91, "elapsed_time": "13:23:18", "remaining_time": "1 day, 4:33:55", "throughput": 335.53, "total_tokens": 16172224} {"current_steps": 12770, "total_steps": 40000, "loss": 0.0639, "lr": 0.2306821378414155, "epoch": 0.6239464490753182, "percentage": 31.92, "elapsed_time": "13:23:21", "remaining_time": "1 day, 4:33:02", "throughput": 335.65, "total_tokens": 16178816} {"current_steps": 12775, "total_steps": 40000, "loss": 0.0634, "lr": 0.2306324735958199, "epoch": 0.6241907507390125, "percentage": 31.94, "elapsed_time": "13:23:25", "remaining_time": "1 day, 4:32:10", "throughput": 335.76, "total_tokens": 16185248} {"current_steps": 12780, "total_steps": 40000, "loss": 0.0433, "lr": 0.23058279691568362, "epoch": 0.6244350524027069, "percentage": 31.95, "elapsed_time": "13:23:28", "remaining_time": "1 day, 4:31:17", "throughput": 335.86, "total_tokens": 16191232} {"current_steps": 12785, "total_steps": 40000, "loss": 0.0572, "lr": 0.23053310780866745, "epoch": 0.6246793540664012, "percentage": 31.96, "elapsed_time": "13:23:31", "remaining_time": "1 day, 4:30:25", "throughput": 335.97, "total_tokens": 16197568} {"current_steps": 12790, "total_steps": 40000, "loss": 0.0545, "lr": 0.23048340628243397, "epoch": 0.6249236557300956, "percentage": 31.97, "elapsed_time": "13:23:34", "remaining_time": "1 day, 4:29:32", "throughput": 336.08, "total_tokens": 16203744} {"current_steps": 12795, "total_steps": 40000, "loss": 0.0898, "lr": 0.23043369234464783, "epoch": 0.6251679573937898, "percentage": 31.99, "elapsed_time": "13:23:37", "remaining_time": "1 day, 4:28:40", "throughput": 336.19, "total_tokens": 16210272} {"current_steps": 12800, "total_steps": 40000, "loss": 0.0501, "lr": 0.2303839660029755, "epoch": 0.6254122590574842, "percentage": 32.0, "elapsed_time": "13:23:40", "remaining_time": "1 day, 4:27:48", "throughput": 336.3, "total_tokens": 16216768} {"current_steps": 12800, "total_steps": 40000, "eval_loss": 0.07034800946712494, "epoch": 0.6254122590574842, "percentage": 32.0, "elapsed_time": "13:34:20", "remaining_time": "1 day, 4:50:27", "throughput": 331.9, "total_tokens": 16216768} {"current_steps": 12805, "total_steps": 40000, "loss": 0.0612, "lr": 0.23033422726508548, "epoch": 0.6256565607211785, "percentage": 32.01, "elapsed_time": "13:34:24", "remaining_time": "1 day, 4:49:36", "throughput": 332.0, "total_tokens": 16222880} {"current_steps": 12810, "total_steps": 40000, "loss": 0.0602, "lr": 0.23028447613864808, "epoch": 0.6259008623848729, "percentage": 32.02, "elapsed_time": "13:34:27", "remaining_time": "1 day, 4:48:43", "throughput": 332.1, "total_tokens": 16228832} {"current_steps": 12815, "total_steps": 40000, "loss": 0.0533, "lr": 0.2302347126313355, "epoch": 0.6261451640485671, "percentage": 32.04, "elapsed_time": "13:34:30", "remaining_time": "1 day, 4:47:50", "throughput": 332.21, "total_tokens": 16234944} {"current_steps": 12820, "total_steps": 40000, "loss": 0.084, "lr": 0.23018493675082197, "epoch": 0.6263894657122615, "percentage": 32.05, "elapsed_time": "13:34:33", "remaining_time": "1 day, 4:46:57", "throughput": 332.32, "total_tokens": 16241600} {"current_steps": 12825, "total_steps": 40000, "loss": 0.0409, "lr": 0.2301351485047835, "epoch": 0.6266337673759559, "percentage": 32.06, "elapsed_time": "13:34:36", "remaining_time": "1 day, 4:46:04", "throughput": 332.43, "total_tokens": 16247936} {"current_steps": 12830, "total_steps": 40000, "loss": 0.085, "lr": 0.23008534790089813, "epoch": 0.6268780690396502, "percentage": 32.07, "elapsed_time": "13:34:39", "remaining_time": "1 day, 4:45:11", "throughput": 332.53, "total_tokens": 16253984} {"current_steps": 12835, "total_steps": 40000, "loss": 0.0612, "lr": 0.2300355349468457, "epoch": 0.6271223707033445, "percentage": 32.09, "elapsed_time": "13:34:42", "remaining_time": "1 day, 4:44:18", "throughput": 332.63, "total_tokens": 16259968} {"current_steps": 12840, "total_steps": 40000, "loss": 0.0903, "lr": 0.22998570965030793, "epoch": 0.6273666723670388, "percentage": 32.1, "elapsed_time": "13:34:45", "remaining_time": "1 day, 4:43:25", "throughput": 332.74, "total_tokens": 16266208} {"current_steps": 12845, "total_steps": 40000, "loss": 0.0683, "lr": 0.22993587201896862, "epoch": 0.6276109740307332, "percentage": 32.11, "elapsed_time": "13:34:48", "remaining_time": "1 day, 4:42:32", "throughput": 332.84, "total_tokens": 16272000} {"current_steps": 12850, "total_steps": 40000, "loss": 0.051, "lr": 0.2298860220605133, "epoch": 0.6278552756944275, "percentage": 32.12, "elapsed_time": "13:34:51", "remaining_time": "1 day, 4:41:40", "throughput": 332.94, "total_tokens": 16278144} {"current_steps": 12855, "total_steps": 40000, "loss": 0.0718, "lr": 0.22983615978262942, "epoch": 0.6280995773581218, "percentage": 32.14, "elapsed_time": "13:34:54", "remaining_time": "1 day, 4:40:47", "throughput": 333.06, "total_tokens": 16284896} {"current_steps": 12860, "total_steps": 40000, "loss": 0.0473, "lr": 0.22978628519300648, "epoch": 0.6283438790218161, "percentage": 32.15, "elapsed_time": "13:34:57", "remaining_time": "1 day, 4:39:54", "throughput": 333.17, "total_tokens": 16291200} {"current_steps": 12865, "total_steps": 40000, "loss": 0.0821, "lr": 0.22973639829933568, "epoch": 0.6285881806855105, "percentage": 32.16, "elapsed_time": "13:35:00", "remaining_time": "1 day, 4:39:02", "throughput": 333.27, "total_tokens": 16297280} {"current_steps": 12870, "total_steps": 40000, "loss": 0.0416, "lr": 0.22968649910931027, "epoch": 0.6288324823492047, "percentage": 32.17, "elapsed_time": "13:35:03", "remaining_time": "1 day, 4:38:09", "throughput": 333.38, "total_tokens": 16303616} {"current_steps": 12875, "total_steps": 40000, "loss": 0.0528, "lr": 0.22963658763062528, "epoch": 0.6290767840128991, "percentage": 32.19, "elapsed_time": "13:35:07", "remaining_time": "1 day, 4:37:17", "throughput": 333.49, "total_tokens": 16309984} {"current_steps": 12880, "total_steps": 40000, "loss": 0.0557, "lr": 0.22958666387097765, "epoch": 0.6293210856765935, "percentage": 32.2, "elapsed_time": "13:35:10", "remaining_time": "1 day, 4:36:24", "throughput": 333.59, "total_tokens": 16315872} {"current_steps": 12885, "total_steps": 40000, "loss": 0.0664, "lr": 0.22953672783806633, "epoch": 0.6295653873402878, "percentage": 32.21, "elapsed_time": "13:35:13", "remaining_time": "1 day, 4:35:32", "throughput": 333.7, "total_tokens": 16322208} {"current_steps": 12890, "total_steps": 40000, "loss": 0.0892, "lr": 0.22948677953959207, "epoch": 0.6298096890039822, "percentage": 32.23, "elapsed_time": "13:35:16", "remaining_time": "1 day, 4:34:39", "throughput": 333.81, "total_tokens": 16328608} {"current_steps": 12895, "total_steps": 40000, "loss": 0.102, "lr": 0.2294368189832575, "epoch": 0.6300539906676764, "percentage": 32.24, "elapsed_time": "13:35:19", "remaining_time": "1 day, 4:33:47", "throughput": 333.91, "total_tokens": 16334880} {"current_steps": 12900, "total_steps": 40000, "loss": 0.0597, "lr": 0.2293868461767672, "epoch": 0.6302982923313708, "percentage": 32.25, "elapsed_time": "13:35:22", "remaining_time": "1 day, 4:32:55", "throughput": 334.03, "total_tokens": 16341504} {"current_steps": 12905, "total_steps": 40000, "loss": 0.0768, "lr": 0.22933686112782758, "epoch": 0.6305425939950651, "percentage": 32.26, "elapsed_time": "13:35:25", "remaining_time": "1 day, 4:32:02", "throughput": 334.13, "total_tokens": 16347712} {"current_steps": 12910, "total_steps": 40000, "loss": 0.0949, "lr": 0.22928686384414698, "epoch": 0.6307868956587595, "percentage": 32.27, "elapsed_time": "13:35:28", "remaining_time": "1 day, 4:31:10", "throughput": 334.26, "total_tokens": 16354816} {"current_steps": 12915, "total_steps": 40000, "loss": 0.0618, "lr": 0.22923685433343552, "epoch": 0.6310311973224537, "percentage": 32.29, "elapsed_time": "13:35:31", "remaining_time": "1 day, 4:30:18", "throughput": 334.36, "total_tokens": 16360896} {"current_steps": 12920, "total_steps": 40000, "loss": 0.0673, "lr": 0.22918683260340542, "epoch": 0.6312754989861481, "percentage": 32.3, "elapsed_time": "13:35:34", "remaining_time": "1 day, 4:29:26", "throughput": 334.47, "total_tokens": 16367360} {"current_steps": 12925, "total_steps": 40000, "loss": 0.0598, "lr": 0.2291367986617706, "epoch": 0.6315198006498425, "percentage": 32.31, "elapsed_time": "13:35:37", "remaining_time": "1 day, 4:28:34", "throughput": 334.58, "total_tokens": 16373728} {"current_steps": 12930, "total_steps": 40000, "loss": 0.0649, "lr": 0.22908675251624697, "epoch": 0.6317641023135367, "percentage": 32.32, "elapsed_time": "13:35:41", "remaining_time": "1 day, 4:27:42", "throughput": 334.69, "total_tokens": 16380032} {"current_steps": 12935, "total_steps": 40000, "loss": 0.074, "lr": 0.22903669417455216, "epoch": 0.6320084039772311, "percentage": 32.34, "elapsed_time": "13:35:44", "remaining_time": "1 day, 4:26:49", "throughput": 334.8, "total_tokens": 16386272} {"current_steps": 12940, "total_steps": 40000, "loss": 0.0882, "lr": 0.22898662364440592, "epoch": 0.6322527056409254, "percentage": 32.35, "elapsed_time": "13:35:47", "remaining_time": "1 day, 4:25:57", "throughput": 334.9, "total_tokens": 16392512} {"current_steps": 12945, "total_steps": 40000, "loss": 0.076, "lr": 0.2289365409335297, "epoch": 0.6324970073046198, "percentage": 32.36, "elapsed_time": "13:35:50", "remaining_time": "1 day, 4:25:06", "throughput": 335.01, "total_tokens": 16399040} {"current_steps": 12950, "total_steps": 40000, "loss": 0.0894, "lr": 0.2288864460496469, "epoch": 0.632741308968314, "percentage": 32.38, "elapsed_time": "13:35:53", "remaining_time": "1 day, 4:24:13", "throughput": 335.12, "total_tokens": 16405280} {"current_steps": 12955, "total_steps": 40000, "loss": 0.0631, "lr": 0.22883633900048272, "epoch": 0.6329856106320084, "percentage": 32.39, "elapsed_time": "13:35:56", "remaining_time": "1 day, 4:23:22", "throughput": 335.23, "total_tokens": 16411776} {"current_steps": 12960, "total_steps": 40000, "loss": 0.0812, "lr": 0.2287862197937644, "epoch": 0.6332299122957027, "percentage": 32.4, "elapsed_time": "13:35:59", "remaining_time": "1 day, 4:22:30", "throughput": 335.33, "total_tokens": 16417632} {"current_steps": 12965, "total_steps": 40000, "loss": 0.0814, "lr": 0.2287360884372209, "epoch": 0.6334742139593971, "percentage": 32.41, "elapsed_time": "13:36:02", "remaining_time": "1 day, 4:21:38", "throughput": 335.44, "total_tokens": 16424096} {"current_steps": 12970, "total_steps": 40000, "loss": 0.0508, "lr": 0.22868594493858307, "epoch": 0.6337185156230913, "percentage": 32.42, "elapsed_time": "13:36:05", "remaining_time": "1 day, 4:20:46", "throughput": 335.55, "total_tokens": 16430208} {"current_steps": 12975, "total_steps": 40000, "loss": 0.0665, "lr": 0.2286357893055837, "epoch": 0.6339628172867857, "percentage": 32.44, "elapsed_time": "13:36:08", "remaining_time": "1 day, 4:19:54", "throughput": 335.64, "total_tokens": 16435872} {"current_steps": 12980, "total_steps": 40000, "loss": 0.0756, "lr": 0.22858562154595746, "epoch": 0.6342071189504801, "percentage": 32.45, "elapsed_time": "13:36:11", "remaining_time": "1 day, 4:19:02", "throughput": 335.76, "total_tokens": 16442656} {"current_steps": 12985, "total_steps": 40000, "loss": 0.0593, "lr": 0.22853544166744078, "epoch": 0.6344514206141744, "percentage": 32.46, "elapsed_time": "13:36:14", "remaining_time": "1 day, 4:18:11", "throughput": 335.87, "total_tokens": 16449376} {"current_steps": 12990, "total_steps": 40000, "loss": 0.0696, "lr": 0.22848524967777206, "epoch": 0.6346957222778687, "percentage": 32.48, "elapsed_time": "13:36:18", "remaining_time": "1 day, 4:17:20", "throughput": 336.0, "total_tokens": 16456640} {"current_steps": 12995, "total_steps": 40000, "loss": 0.0595, "lr": 0.22843504558469152, "epoch": 0.634940023941563, "percentage": 32.49, "elapsed_time": "13:36:21", "remaining_time": "1 day, 4:16:28", "throughput": 336.11, "total_tokens": 16463392} {"current_steps": 13000, "total_steps": 40000, "loss": 0.0689, "lr": 0.2283848293959413, "epoch": 0.6351843256052574, "percentage": 32.5, "elapsed_time": "13:36:24", "remaining_time": "1 day, 4:15:37", "throughput": 336.22, "total_tokens": 16469792} {"current_steps": 13000, "total_steps": 40000, "eval_loss": 0.07054082304239273, "epoch": 0.6351843256052574, "percentage": 32.5, "elapsed_time": "13:47:04", "remaining_time": "1 day, 4:37:46", "throughput": 331.89, "total_tokens": 16469792} {"current_steps": 13005, "total_steps": 40000, "loss": 0.0573, "lr": 0.22833460111926532, "epoch": 0.6354286272689517, "percentage": 32.51, "elapsed_time": "13:47:08", "remaining_time": "1 day, 4:36:55", "throughput": 332.0, "total_tokens": 16476448} {"current_steps": 13010, "total_steps": 40000, "loss": 0.1068, "lr": 0.22828436076240946, "epoch": 0.635672928932646, "percentage": 32.52, "elapsed_time": "13:47:11", "remaining_time": "1 day, 4:36:03", "throughput": 332.11, "total_tokens": 16483200} {"current_steps": 13015, "total_steps": 40000, "loss": 0.0616, "lr": 0.22823410833312135, "epoch": 0.6359172305963403, "percentage": 32.54, "elapsed_time": "13:47:14", "remaining_time": "1 day, 4:35:11", "throughput": 332.22, "total_tokens": 16489600} {"current_steps": 13020, "total_steps": 40000, "loss": 0.0997, "lr": 0.2281838438391506, "epoch": 0.6361615322600347, "percentage": 32.55, "elapsed_time": "13:47:17", "remaining_time": "1 day, 4:34:19", "throughput": 332.32, "total_tokens": 16495776} {"current_steps": 13025, "total_steps": 40000, "loss": 0.0742, "lr": 0.22813356728824863, "epoch": 0.6364058339237291, "percentage": 32.56, "elapsed_time": "13:47:20", "remaining_time": "1 day, 4:33:26", "throughput": 332.43, "total_tokens": 16502016} {"current_steps": 13030, "total_steps": 40000, "loss": 0.0788, "lr": 0.2280832786881687, "epoch": 0.6366501355874233, "percentage": 32.57, "elapsed_time": "13:47:23", "remaining_time": "1 day, 4:32:34", "throughput": 332.53, "total_tokens": 16508032} {"current_steps": 13035, "total_steps": 40000, "loss": 0.0774, "lr": 0.22803297804666592, "epoch": 0.6368944372511177, "percentage": 32.59, "elapsed_time": "13:47:26", "remaining_time": "1 day, 4:31:42", "throughput": 332.64, "total_tokens": 16514368} {"current_steps": 13040, "total_steps": 40000, "loss": 0.052, "lr": 0.22798266537149728, "epoch": 0.637138738914812, "percentage": 32.6, "elapsed_time": "13:47:29", "remaining_time": "1 day, 4:30:50", "throughput": 332.74, "total_tokens": 16520256} {"current_steps": 13045, "total_steps": 40000, "loss": 0.0377, "lr": 0.22793234067042167, "epoch": 0.6373830405785064, "percentage": 32.61, "elapsed_time": "13:47:33", "remaining_time": "1 day, 4:29:58", "throughput": 332.85, "total_tokens": 16526944} {"current_steps": 13050, "total_steps": 40000, "loss": 0.0961, "lr": 0.22788200395119979, "epoch": 0.6376273422422006, "percentage": 32.62, "elapsed_time": "13:47:36", "remaining_time": "1 day, 4:29:06", "throughput": 332.95, "total_tokens": 16532800} {"current_steps": 13055, "total_steps": 40000, "loss": 0.0561, "lr": 0.2278316552215942, "epoch": 0.637871643905895, "percentage": 32.64, "elapsed_time": "13:47:39", "remaining_time": "1 day, 4:28:14", "throughput": 333.05, "total_tokens": 16539008} {"current_steps": 13060, "total_steps": 40000, "loss": 0.081, "lr": 0.22778129448936918, "epoch": 0.6381159455695893, "percentage": 32.65, "elapsed_time": "13:47:42", "remaining_time": "1 day, 4:27:22", "throughput": 333.16, "total_tokens": 16545504} {"current_steps": 13065, "total_steps": 40000, "loss": 0.0749, "lr": 0.22773092176229118, "epoch": 0.6383602472332837, "percentage": 32.66, "elapsed_time": "13:47:45", "remaining_time": "1 day, 4:26:30", "throughput": 333.27, "total_tokens": 16551904} {"current_steps": 13070, "total_steps": 40000, "loss": 0.0431, "lr": 0.22768053704812816, "epoch": 0.638604548896978, "percentage": 32.67, "elapsed_time": "13:47:48", "remaining_time": "1 day, 4:25:38", "throughput": 333.38, "total_tokens": 16558400} {"current_steps": 13075, "total_steps": 40000, "loss": 0.0689, "lr": 0.22763014035465018, "epoch": 0.6388488505606723, "percentage": 32.69, "elapsed_time": "13:47:51", "remaining_time": "1 day, 4:24:47", "throughput": 333.49, "total_tokens": 16564864} {"current_steps": 13080, "total_steps": 40000, "loss": 0.0881, "lr": 0.22757973168962892, "epoch": 0.6390931522243667, "percentage": 32.7, "elapsed_time": "13:47:54", "remaining_time": "1 day, 4:23:55", "throughput": 333.59, "total_tokens": 16570880} {"current_steps": 13085, "total_steps": 40000, "loss": 0.072, "lr": 0.22752931106083818, "epoch": 0.639337453888061, "percentage": 32.71, "elapsed_time": "13:47:57", "remaining_time": "1 day, 4:23:03", "throughput": 333.69, "total_tokens": 16577152} {"current_steps": 13090, "total_steps": 40000, "loss": 0.0894, "lr": 0.22747887847605341, "epoch": 0.6395817555517553, "percentage": 32.73, "elapsed_time": "13:48:00", "remaining_time": "1 day, 4:22:11", "throughput": 333.8, "total_tokens": 16583200} {"current_steps": 13095, "total_steps": 40000, "loss": 0.0733, "lr": 0.22742843394305184, "epoch": 0.6398260572154496, "percentage": 32.74, "elapsed_time": "13:48:03", "remaining_time": "1 day, 4:21:20", "throughput": 333.9, "total_tokens": 16589632} {"current_steps": 13100, "total_steps": 40000, "loss": 0.0423, "lr": 0.22737797746961272, "epoch": 0.640070358879144, "percentage": 32.75, "elapsed_time": "13:48:06", "remaining_time": "1 day, 4:20:28", "throughput": 334.02, "total_tokens": 16596288} {"current_steps": 13105, "total_steps": 40000, "loss": 0.0591, "lr": 0.22732750906351712, "epoch": 0.6403146605428383, "percentage": 32.76, "elapsed_time": "13:48:10", "remaining_time": "1 day, 4:19:37", "throughput": 334.12, "total_tokens": 16602432} {"current_steps": 13110, "total_steps": 40000, "loss": 0.1155, "lr": 0.22727702873254785, "epoch": 0.6405589622065326, "percentage": 32.77, "elapsed_time": "13:48:13", "remaining_time": "1 day, 4:18:45", "throughput": 334.22, "total_tokens": 16608544} {"current_steps": 13115, "total_steps": 40000, "loss": 0.0628, "lr": 0.22722653648448968, "epoch": 0.6408032638702269, "percentage": 32.79, "elapsed_time": "13:48:16", "remaining_time": "1 day, 4:17:54", "throughput": 334.32, "total_tokens": 16614560} {"current_steps": 13120, "total_steps": 40000, "loss": 0.097, "lr": 0.22717603232712902, "epoch": 0.6410475655339213, "percentage": 32.8, "elapsed_time": "13:48:19", "remaining_time": "1 day, 4:17:02", "throughput": 334.43, "total_tokens": 16620672} {"current_steps": 13125, "total_steps": 40000, "loss": 0.0639, "lr": 0.22712551626825436, "epoch": 0.6412918671976157, "percentage": 32.81, "elapsed_time": "13:48:22", "remaining_time": "1 day, 4:16:11", "throughput": 334.54, "total_tokens": 16627360} {"current_steps": 13130, "total_steps": 40000, "loss": 0.0558, "lr": 0.2270749883156559, "epoch": 0.6415361688613099, "percentage": 32.82, "elapsed_time": "13:48:25", "remaining_time": "1 day, 4:15:20", "throughput": 334.64, "total_tokens": 16633568} {"current_steps": 13135, "total_steps": 40000, "loss": 0.0774, "lr": 0.22702444847712563, "epoch": 0.6417804705250043, "percentage": 32.84, "elapsed_time": "13:48:28", "remaining_time": "1 day, 4:14:28", "throughput": 334.74, "total_tokens": 16639456} {"current_steps": 13140, "total_steps": 40000, "loss": 0.0623, "lr": 0.22697389676045743, "epoch": 0.6420247721886986, "percentage": 32.85, "elapsed_time": "13:48:31", "remaining_time": "1 day, 4:13:37", "throughput": 334.84, "total_tokens": 16645632} {"current_steps": 13145, "total_steps": 40000, "loss": 0.0735, "lr": 0.22692333317344704, "epoch": 0.642269073852393, "percentage": 32.86, "elapsed_time": "13:48:34", "remaining_time": "1 day, 4:12:45", "throughput": 334.94, "total_tokens": 16651520} {"current_steps": 13150, "total_steps": 40000, "loss": 0.0811, "lr": 0.22687275772389198, "epoch": 0.6425133755160872, "percentage": 32.88, "elapsed_time": "13:48:37", "remaining_time": "1 day, 4:11:54", "throughput": 335.06, "total_tokens": 16658176} {"current_steps": 13155, "total_steps": 40000, "loss": 0.0508, "lr": 0.22682217041959168, "epoch": 0.6427576771797816, "percentage": 32.89, "elapsed_time": "13:48:40", "remaining_time": "1 day, 4:11:03", "throughput": 335.17, "total_tokens": 16665056} {"current_steps": 13160, "total_steps": 40000, "loss": 0.0678, "lr": 0.2267715712683473, "epoch": 0.6430019788434759, "percentage": 32.9, "elapsed_time": "13:48:43", "remaining_time": "1 day, 4:10:12", "throughput": 335.27, "total_tokens": 16671136} {"current_steps": 13165, "total_steps": 40000, "loss": 0.0786, "lr": 0.22672096027796182, "epoch": 0.6432462805071703, "percentage": 32.91, "elapsed_time": "13:48:47", "remaining_time": "1 day, 4:09:21", "throughput": 335.39, "total_tokens": 16677728} {"current_steps": 13170, "total_steps": 40000, "loss": 0.08, "lr": 0.22667033745624016, "epoch": 0.6434905821708646, "percentage": 32.92, "elapsed_time": "13:48:50", "remaining_time": "1 day, 4:08:30", "throughput": 335.49, "total_tokens": 16684192} {"current_steps": 13175, "total_steps": 40000, "loss": 0.0842, "lr": 0.22661970281098895, "epoch": 0.6437348838345589, "percentage": 32.94, "elapsed_time": "13:48:53", "remaining_time": "1 day, 4:07:39", "throughput": 335.59, "total_tokens": 16690016} {"current_steps": 13180, "total_steps": 40000, "loss": 0.0646, "lr": 0.22656905635001667, "epoch": 0.6439791854982533, "percentage": 32.95, "elapsed_time": "13:48:56", "remaining_time": "1 day, 4:06:48", "throughput": 335.7, "total_tokens": 16696320} {"current_steps": 13185, "total_steps": 40000, "loss": 0.0836, "lr": 0.2265183980811337, "epoch": 0.6442234871619476, "percentage": 32.96, "elapsed_time": "13:48:59", "remaining_time": "1 day, 4:05:57", "throughput": 335.8, "total_tokens": 16702464} {"current_steps": 13190, "total_steps": 40000, "loss": 0.0947, "lr": 0.22646772801215218, "epoch": 0.6444677888256419, "percentage": 32.98, "elapsed_time": "13:49:02", "remaining_time": "1 day, 4:05:06", "throughput": 335.91, "total_tokens": 16708832} {"current_steps": 13195, "total_steps": 40000, "loss": 0.062, "lr": 0.22641704615088598, "epoch": 0.6447120904893362, "percentage": 32.99, "elapsed_time": "13:49:05", "remaining_time": "1 day, 4:04:15", "throughput": 336.02, "total_tokens": 16715392} {"current_steps": 13200, "total_steps": 40000, "loss": 0.0738, "lr": 0.22636635250515103, "epoch": 0.6449563921530306, "percentage": 33.0, "elapsed_time": "13:49:08", "remaining_time": "1 day, 4:03:24", "throughput": 336.12, "total_tokens": 16721536} {"current_steps": 13200, "total_steps": 40000, "eval_loss": 0.07069843262434006, "epoch": 0.6449563921530306, "percentage": 33.0, "elapsed_time": "13:59:48", "remaining_time": "1 day, 4:25:04", "throughput": 331.85, "total_tokens": 16721536} {"current_steps": 13205, "total_steps": 40000, "loss": 0.0616, "lr": 0.2263156470827648, "epoch": 0.6452006938167248, "percentage": 33.01, "elapsed_time": "13:59:52", "remaining_time": "1 day, 4:24:14", "throughput": 331.95, "total_tokens": 16727840} {"current_steps": 13210, "total_steps": 40000, "loss": 0.0451, "lr": 0.22626492989154678, "epoch": 0.6454449954804192, "percentage": 33.02, "elapsed_time": "13:59:55", "remaining_time": "1 day, 4:23:22", "throughput": 332.06, "total_tokens": 16734400} {"current_steps": 13215, "total_steps": 40000, "loss": 0.0448, "lr": 0.22621420093931813, "epoch": 0.6456892971441136, "percentage": 33.04, "elapsed_time": "13:59:58", "remaining_time": "1 day, 4:22:31", "throughput": 332.17, "total_tokens": 16740704} {"current_steps": 13220, "total_steps": 40000, "loss": 0.0714, "lr": 0.22616346023390194, "epoch": 0.6459335988078079, "percentage": 33.05, "elapsed_time": "14:00:01", "remaining_time": "1 day, 4:21:39", "throughput": 332.27, "total_tokens": 16746880} {"current_steps": 13225, "total_steps": 40000, "loss": 0.049, "lr": 0.22611270778312306, "epoch": 0.6461779004715023, "percentage": 33.06, "elapsed_time": "14:00:04", "remaining_time": "1 day, 4:20:48", "throughput": 332.37, "total_tokens": 16752896} {"current_steps": 13230, "total_steps": 40000, "loss": 0.0911, "lr": 0.2260619435948081, "epoch": 0.6464222021351965, "percentage": 33.07, "elapsed_time": "14:00:07", "remaining_time": "1 day, 4:19:56", "throughput": 332.48, "total_tokens": 16759552} {"current_steps": 13235, "total_steps": 40000, "loss": 0.0421, "lr": 0.22601116767678567, "epoch": 0.6466665037988909, "percentage": 33.09, "elapsed_time": "14:00:11", "remaining_time": "1 day, 4:19:05", "throughput": 332.59, "total_tokens": 16766016} {"current_steps": 13240, "total_steps": 40000, "loss": 0.0713, "lr": 0.2259603800368859, "epoch": 0.6469108054625852, "percentage": 33.1, "elapsed_time": "14:00:14", "remaining_time": "1 day, 4:18:14", "throughput": 332.69, "total_tokens": 16772064} {"current_steps": 13245, "total_steps": 40000, "loss": 0.064, "lr": 0.22590958068294098, "epoch": 0.6471551071262795, "percentage": 33.11, "elapsed_time": "14:00:17", "remaining_time": "1 day, 4:17:23", "throughput": 332.8, "total_tokens": 16778624} {"current_steps": 13250, "total_steps": 40000, "loss": 0.0971, "lr": 0.22585876962278478, "epoch": 0.6473994087899738, "percentage": 33.12, "elapsed_time": "14:00:20", "remaining_time": "1 day, 4:16:31", "throughput": 332.91, "total_tokens": 16785216} {"current_steps": 13255, "total_steps": 40000, "loss": 0.0767, "lr": 0.22580794686425298, "epoch": 0.6476437104536682, "percentage": 33.14, "elapsed_time": "14:00:23", "remaining_time": "1 day, 4:15:40", "throughput": 333.01, "total_tokens": 16791584} {"current_steps": 13260, "total_steps": 40000, "loss": 0.0706, "lr": 0.22575711241518312, "epoch": 0.6478880121173625, "percentage": 33.15, "elapsed_time": "14:00:26", "remaining_time": "1 day, 4:14:49", "throughput": 333.12, "total_tokens": 16797920} {"current_steps": 13265, "total_steps": 40000, "loss": 0.0786, "lr": 0.22570626628341453, "epoch": 0.6481323137810568, "percentage": 33.16, "elapsed_time": "14:00:29", "remaining_time": "1 day, 4:13:58", "throughput": 333.21, "total_tokens": 16803648} {"current_steps": 13270, "total_steps": 40000, "loss": 0.0664, "lr": 0.22565540847678828, "epoch": 0.6483766154447512, "percentage": 33.17, "elapsed_time": "14:00:32", "remaining_time": "1 day, 4:13:07", "throughput": 333.32, "total_tokens": 16810112} {"current_steps": 13275, "total_steps": 40000, "loss": 0.0665, "lr": 0.2256045390031473, "epoch": 0.6486209171084455, "percentage": 33.19, "elapsed_time": "14:00:35", "remaining_time": "1 day, 4:12:16", "throughput": 333.42, "total_tokens": 16816320} {"current_steps": 13280, "total_steps": 40000, "loss": 0.0876, "lr": 0.22555365787033627, "epoch": 0.6488652187721399, "percentage": 33.2, "elapsed_time": "14:00:38", "remaining_time": "1 day, 4:11:25", "throughput": 333.53, "total_tokens": 16823040} {"current_steps": 13285, "total_steps": 40000, "loss": 0.0669, "lr": 0.22550276508620173, "epoch": 0.6491095204358341, "percentage": 33.21, "elapsed_time": "14:00:42", "remaining_time": "1 day, 4:10:34", "throughput": 333.65, "total_tokens": 16830144} {"current_steps": 13290, "total_steps": 40000, "loss": 0.0838, "lr": 0.22545186065859202, "epoch": 0.6493538220995285, "percentage": 33.23, "elapsed_time": "14:00:45", "remaining_time": "1 day, 4:09:43", "throughput": 333.76, "total_tokens": 16836640} {"current_steps": 13295, "total_steps": 40000, "loss": 0.0645, "lr": 0.2254009445953572, "epoch": 0.6495981237632228, "percentage": 33.24, "elapsed_time": "14:00:48", "remaining_time": "1 day, 4:08:53", "throughput": 333.87, "total_tokens": 16843328} {"current_steps": 13300, "total_steps": 40000, "loss": 0.0481, "lr": 0.22535001690434917, "epoch": 0.6498424254269172, "percentage": 33.25, "elapsed_time": "14:00:51", "remaining_time": "1 day, 4:08:02", "throughput": 333.98, "total_tokens": 16849792} {"current_steps": 13305, "total_steps": 40000, "loss": 0.0441, "lr": 0.22529907759342163, "epoch": 0.6500867270906114, "percentage": 33.26, "elapsed_time": "14:00:54", "remaining_time": "1 day, 4:07:11", "throughput": 334.09, "total_tokens": 16856128} {"current_steps": 13310, "total_steps": 40000, "loss": 0.1082, "lr": 0.22524812667043007, "epoch": 0.6503310287543058, "percentage": 33.27, "elapsed_time": "14:00:57", "remaining_time": "1 day, 4:06:20", "throughput": 334.19, "total_tokens": 16862592} {"current_steps": 13315, "total_steps": 40000, "loss": 0.0707, "lr": 0.22519716414323177, "epoch": 0.6505753304180002, "percentage": 33.29, "elapsed_time": "14:01:00", "remaining_time": "1 day, 4:05:30", "throughput": 334.3, "total_tokens": 16869024} {"current_steps": 13320, "total_steps": 40000, "loss": 0.0594, "lr": 0.22514619001968567, "epoch": 0.6508196320816945, "percentage": 33.3, "elapsed_time": "14:01:03", "remaining_time": "1 day, 4:04:39", "throughput": 334.41, "total_tokens": 16875520} {"current_steps": 13325, "total_steps": 40000, "loss": 0.059, "lr": 0.2250952043076528, "epoch": 0.6510639337453888, "percentage": 33.31, "elapsed_time": "14:01:07", "remaining_time": "1 day, 4:03:48", "throughput": 334.51, "total_tokens": 16881984} {"current_steps": 13330, "total_steps": 40000, "loss": 0.0783, "lr": 0.2250442070149957, "epoch": 0.6513082354090831, "percentage": 33.32, "elapsed_time": "14:01:10", "remaining_time": "1 day, 4:02:58", "throughput": 334.62, "total_tokens": 16888448} {"current_steps": 13335, "total_steps": 40000, "loss": 0.0519, "lr": 0.22499319814957885, "epoch": 0.6515525370727775, "percentage": 33.34, "elapsed_time": "14:01:13", "remaining_time": "1 day, 4:02:07", "throughput": 334.72, "total_tokens": 16894528} {"current_steps": 13340, "total_steps": 40000, "loss": 0.0511, "lr": 0.2249421777192684, "epoch": 0.6517968387364718, "percentage": 33.35, "elapsed_time": "14:01:16", "remaining_time": "1 day, 4:01:16", "throughput": 334.83, "total_tokens": 16900896} {"current_steps": 13345, "total_steps": 40000, "loss": 0.0734, "lr": 0.22489114573193236, "epoch": 0.6520411404001661, "percentage": 33.36, "elapsed_time": "14:01:19", "remaining_time": "1 day, 4:00:26", "throughput": 334.93, "total_tokens": 16907072} {"current_steps": 13350, "total_steps": 40000, "loss": 0.0478, "lr": 0.2248401021954405, "epoch": 0.6522854420638604, "percentage": 33.38, "elapsed_time": "14:01:22", "remaining_time": "1 day, 3:59:35", "throughput": 335.03, "total_tokens": 16913152} {"current_steps": 13355, "total_steps": 40000, "loss": 0.0905, "lr": 0.22478904711766443, "epoch": 0.6525297437275548, "percentage": 33.39, "elapsed_time": "14:01:25", "remaining_time": "1 day, 3:58:45", "throughput": 335.14, "total_tokens": 16920000} {"current_steps": 13360, "total_steps": 40000, "loss": 0.0507, "lr": 0.22473798050647734, "epoch": 0.6527740453912492, "percentage": 33.4, "elapsed_time": "14:01:28", "remaining_time": "1 day, 3:57:55", "throughput": 335.25, "total_tokens": 16926496} {"current_steps": 13365, "total_steps": 40000, "loss": 0.0734, "lr": 0.22468690236975453, "epoch": 0.6530183470549434, "percentage": 33.41, "elapsed_time": "14:01:31", "remaining_time": "1 day, 3:57:04", "throughput": 335.36, "total_tokens": 16932672} {"current_steps": 13370, "total_steps": 40000, "loss": 0.0871, "lr": 0.22463581271537272, "epoch": 0.6532626487186378, "percentage": 33.42, "elapsed_time": "14:01:34", "remaining_time": "1 day, 3:56:13", "throughput": 335.46, "total_tokens": 16938848} {"current_steps": 13375, "total_steps": 40000, "loss": 0.0487, "lr": 0.22458471155121076, "epoch": 0.6535069503823321, "percentage": 33.44, "elapsed_time": "14:01:37", "remaining_time": "1 day, 3:55:23", "throughput": 335.56, "total_tokens": 16945216} {"current_steps": 13380, "total_steps": 40000, "loss": 0.0768, "lr": 0.2245335988851489, "epoch": 0.6537512520460265, "percentage": 33.45, "elapsed_time": "14:01:40", "remaining_time": "1 day, 3:54:33", "throughput": 335.67, "total_tokens": 16951456} {"current_steps": 13385, "total_steps": 40000, "loss": 0.0805, "lr": 0.2244824747250695, "epoch": 0.6539955537097207, "percentage": 33.46, "elapsed_time": "14:01:43", "remaining_time": "1 day, 3:53:43", "throughput": 335.78, "total_tokens": 16958048} {"current_steps": 13390, "total_steps": 40000, "loss": 0.088, "lr": 0.22443133907885646, "epoch": 0.6542398553734151, "percentage": 33.48, "elapsed_time": "14:01:46", "remaining_time": "1 day, 3:52:52", "throughput": 335.86, "total_tokens": 16963392} {"current_steps": 13395, "total_steps": 40000, "loss": 0.0664, "lr": 0.22438019195439557, "epoch": 0.6544841570371094, "percentage": 33.49, "elapsed_time": "14:01:50", "remaining_time": "1 day, 3:52:02", "throughput": 335.97, "total_tokens": 16969952} {"current_steps": 13400, "total_steps": 40000, "loss": 0.0785, "lr": 0.22432903335957435, "epoch": 0.6547284587008038, "percentage": 33.5, "elapsed_time": "14:01:53", "remaining_time": "1 day, 3:51:12", "throughput": 336.07, "total_tokens": 16976192} {"current_steps": 13400, "total_steps": 40000, "eval_loss": 0.07011739164590836, "epoch": 0.6547284587008038, "percentage": 33.5, "elapsed_time": "14:12:33", "remaining_time": "1 day, 4:12:22", "throughput": 331.87, "total_tokens": 16976192} {"current_steps": 13405, "total_steps": 40000, "loss": 0.0445, "lr": 0.22427786330228214, "epoch": 0.654972760364498, "percentage": 33.51, "elapsed_time": "14:12:36", "remaining_time": "1 day, 4:11:33", "throughput": 331.97, "total_tokens": 16982400} {"current_steps": 13410, "total_steps": 40000, "loss": 0.0671, "lr": 0.22422668179040997, "epoch": 0.6552170620281924, "percentage": 33.52, "elapsed_time": "14:12:39", "remaining_time": "1 day, 4:10:42", "throughput": 332.07, "total_tokens": 16988704} {"current_steps": 13415, "total_steps": 40000, "loss": 0.0552, "lr": 0.2241754888318507, "epoch": 0.6554613636918868, "percentage": 33.54, "elapsed_time": "14:12:42", "remaining_time": "1 day, 4:09:51", "throughput": 332.17, "total_tokens": 16994752} {"current_steps": 13420, "total_steps": 40000, "loss": 0.0908, "lr": 0.22412428443449886, "epoch": 0.6557056653555811, "percentage": 33.55, "elapsed_time": "14:12:45", "remaining_time": "1 day, 4:09:00", "throughput": 332.28, "total_tokens": 17001280} {"current_steps": 13425, "total_steps": 40000, "loss": 0.0584, "lr": 0.22407306860625087, "epoch": 0.6559499670192754, "percentage": 33.56, "elapsed_time": "14:12:49", "remaining_time": "1 day, 4:08:10", "throughput": 332.38, "total_tokens": 17007680} {"current_steps": 13430, "total_steps": 40000, "loss": 0.0633, "lr": 0.22402184135500483, "epoch": 0.6561942686829697, "percentage": 33.58, "elapsed_time": "14:12:52", "remaining_time": "1 day, 4:07:19", "throughput": 332.48, "total_tokens": 17013760} {"current_steps": 13435, "total_steps": 40000, "loss": 0.0391, "lr": 0.22397060268866067, "epoch": 0.6564385703466641, "percentage": 33.59, "elapsed_time": "14:12:55", "remaining_time": "1 day, 4:06:28", "throughput": 332.58, "total_tokens": 17019968} {"current_steps": 13440, "total_steps": 40000, "loss": 0.0646, "lr": 0.22391935261511994, "epoch": 0.6566828720103584, "percentage": 33.6, "elapsed_time": "14:12:58", "remaining_time": "1 day, 4:05:38", "throughput": 332.69, "total_tokens": 17026400} {"current_steps": 13445, "total_steps": 40000, "loss": 0.0416, "lr": 0.22386809114228615, "epoch": 0.6569271736740527, "percentage": 33.61, "elapsed_time": "14:13:01", "remaining_time": "1 day, 4:04:47", "throughput": 332.79, "total_tokens": 17032640} {"current_steps": 13450, "total_steps": 40000, "loss": 0.0686, "lr": 0.22381681827806446, "epoch": 0.657171475337747, "percentage": 33.62, "elapsed_time": "14:13:04", "remaining_time": "1 day, 4:03:56", "throughput": 332.89, "total_tokens": 17039040} {"current_steps": 13455, "total_steps": 40000, "loss": 0.092, "lr": 0.22376553403036173, "epoch": 0.6574157770014414, "percentage": 33.64, "elapsed_time": "14:13:07", "remaining_time": "1 day, 4:03:06", "throughput": 333.0, "total_tokens": 17045216} {"current_steps": 13460, "total_steps": 40000, "loss": 0.0795, "lr": 0.22371423840708662, "epoch": 0.6576600786651358, "percentage": 33.65, "elapsed_time": "14:13:10", "remaining_time": "1 day, 4:02:15", "throughput": 333.1, "total_tokens": 17051488} {"current_steps": 13465, "total_steps": 40000, "loss": 0.0628, "lr": 0.22366293141614962, "epoch": 0.65790438032883, "percentage": 33.66, "elapsed_time": "14:13:13", "remaining_time": "1 day, 4:01:25", "throughput": 333.2, "total_tokens": 17057600} {"current_steps": 13470, "total_steps": 40000, "loss": 0.0586, "lr": 0.22361161306546287, "epoch": 0.6581486819925244, "percentage": 33.67, "elapsed_time": "14:13:16", "remaining_time": "1 day, 4:00:35", "throughput": 333.31, "total_tokens": 17064320} {"current_steps": 13475, "total_steps": 40000, "loss": 0.0654, "lr": 0.22356028336294037, "epoch": 0.6583929836562187, "percentage": 33.69, "elapsed_time": "14:13:19", "remaining_time": "1 day, 3:59:44", "throughput": 333.41, "total_tokens": 17070432} {"current_steps": 13480, "total_steps": 40000, "loss": 0.0712, "lr": 0.2235089423164977, "epoch": 0.6586372853199131, "percentage": 33.7, "elapsed_time": "14:13:22", "remaining_time": "1 day, 3:58:54", "throughput": 333.51, "total_tokens": 17076896} {"current_steps": 13485, "total_steps": 40000, "loss": 0.0724, "lr": 0.22345758993405243, "epoch": 0.6588815869836073, "percentage": 33.71, "elapsed_time": "14:13:26", "remaining_time": "1 day, 3:58:04", "throughput": 333.62, "total_tokens": 17083552} {"current_steps": 13490, "total_steps": 40000, "loss": 0.0696, "lr": 0.2234062262235236, "epoch": 0.6591258886473017, "percentage": 33.73, "elapsed_time": "14:13:29", "remaining_time": "1 day, 3:57:14", "throughput": 333.72, "total_tokens": 17089568} {"current_steps": 13495, "total_steps": 40000, "loss": 0.0786, "lr": 0.22335485119283222, "epoch": 0.659370190310996, "percentage": 33.74, "elapsed_time": "14:13:32", "remaining_time": "1 day, 3:56:23", "throughput": 333.82, "total_tokens": 17095520} {"current_steps": 13500, "total_steps": 40000, "loss": 0.0664, "lr": 0.22330346484990093, "epoch": 0.6596144919746904, "percentage": 33.75, "elapsed_time": "14:13:35", "remaining_time": "1 day, 3:55:33", "throughput": 333.92, "total_tokens": 17101632} {"current_steps": 13505, "total_steps": 40000, "loss": 0.0857, "lr": 0.22325206720265425, "epoch": 0.6598587936383846, "percentage": 33.76, "elapsed_time": "14:13:38", "remaining_time": "1 day, 3:54:43", "throughput": 334.02, "total_tokens": 17108096} {"current_steps": 13510, "total_steps": 40000, "loss": 0.1081, "lr": 0.2232006582590182, "epoch": 0.660103095302079, "percentage": 33.77, "elapsed_time": "14:13:41", "remaining_time": "1 day, 3:53:53", "throughput": 334.14, "total_tokens": 17114944} {"current_steps": 13515, "total_steps": 40000, "loss": 0.0584, "lr": 0.22314923802692077, "epoch": 0.6603473969657734, "percentage": 33.79, "elapsed_time": "14:13:44", "remaining_time": "1 day, 3:53:03", "throughput": 334.24, "total_tokens": 17121376} {"current_steps": 13520, "total_steps": 40000, "loss": 0.067, "lr": 0.22309780651429156, "epoch": 0.6605916986294676, "percentage": 33.8, "elapsed_time": "14:13:47", "remaining_time": "1 day, 3:52:13", "throughput": 334.35, "total_tokens": 17128192} {"current_steps": 13525, "total_steps": 40000, "loss": 0.0473, "lr": 0.22304636372906203, "epoch": 0.660836000293162, "percentage": 33.81, "elapsed_time": "14:13:50", "remaining_time": "1 day, 3:51:23", "throughput": 334.46, "total_tokens": 17134656} {"current_steps": 13530, "total_steps": 40000, "loss": 0.0675, "lr": 0.22299490967916522, "epoch": 0.6610803019568563, "percentage": 33.83, "elapsed_time": "14:13:54", "remaining_time": "1 day, 3:50:33", "throughput": 334.56, "total_tokens": 17140864} {"current_steps": 13535, "total_steps": 40000, "loss": 0.0301, "lr": 0.22294344437253602, "epoch": 0.6613246036205507, "percentage": 33.84, "elapsed_time": "14:13:57", "remaining_time": "1 day, 3:49:44", "throughput": 334.68, "total_tokens": 17147808} {"current_steps": 13540, "total_steps": 40000, "loss": 0.0605, "lr": 0.22289196781711101, "epoch": 0.661568905284245, "percentage": 33.85, "elapsed_time": "14:14:00", "remaining_time": "1 day, 3:48:54", "throughput": 334.77, "total_tokens": 17153600} {"current_steps": 13545, "total_steps": 40000, "loss": 0.0467, "lr": 0.2228404800208286, "epoch": 0.6618132069479393, "percentage": 33.86, "elapsed_time": "14:14:03", "remaining_time": "1 day, 3:48:04", "throughput": 334.88, "total_tokens": 17160544} {"current_steps": 13550, "total_steps": 40000, "loss": 0.0709, "lr": 0.22278898099162875, "epoch": 0.6620575086116336, "percentage": 33.88, "elapsed_time": "14:14:06", "remaining_time": "1 day, 3:47:14", "throughput": 334.98, "total_tokens": 17166368} {"current_steps": 13555, "total_steps": 40000, "loss": 0.0717, "lr": 0.22273747073745337, "epoch": 0.662301810275328, "percentage": 33.89, "elapsed_time": "14:14:09", "remaining_time": "1 day, 3:46:24", "throughput": 335.09, "total_tokens": 17173152} {"current_steps": 13560, "total_steps": 40000, "loss": 0.0754, "lr": 0.22268594926624588, "epoch": 0.6625461119390224, "percentage": 33.9, "elapsed_time": "14:14:12", "remaining_time": "1 day, 3:45:35", "throughput": 335.19, "total_tokens": 17179520} {"current_steps": 13565, "total_steps": 40000, "loss": 0.0671, "lr": 0.22263441658595162, "epoch": 0.6627904136027166, "percentage": 33.91, "elapsed_time": "14:14:15", "remaining_time": "1 day, 3:44:45", "throughput": 335.29, "total_tokens": 17185600} {"current_steps": 13570, "total_steps": 40000, "loss": 0.0473, "lr": 0.2225828727045175, "epoch": 0.663034715266411, "percentage": 33.92, "elapsed_time": "14:14:18", "remaining_time": "1 day, 3:43:55", "throughput": 335.39, "total_tokens": 17191712} {"current_steps": 13575, "total_steps": 40000, "loss": 0.0509, "lr": 0.22253131762989228, "epoch": 0.6632790169301053, "percentage": 33.94, "elapsed_time": "14:14:21", "remaining_time": "1 day, 3:43:06", "throughput": 335.5, "total_tokens": 17198560} {"current_steps": 13580, "total_steps": 40000, "loss": 0.086, "lr": 0.2224797513700264, "epoch": 0.6635233185937996, "percentage": 33.95, "elapsed_time": "14:14:25", "remaining_time": "1 day, 3:42:16", "throughput": 335.61, "total_tokens": 17205088} {"current_steps": 13585, "total_steps": 40000, "loss": 0.0646, "lr": 0.22242817393287204, "epoch": 0.6637676202574939, "percentage": 33.96, "elapsed_time": "14:14:28", "remaining_time": "1 day, 3:41:26", "throughput": 335.71, "total_tokens": 17211392} {"current_steps": 13590, "total_steps": 40000, "loss": 0.0464, "lr": 0.22237658532638305, "epoch": 0.6640119219211883, "percentage": 33.98, "elapsed_time": "14:14:31", "remaining_time": "1 day, 3:40:37", "throughput": 335.82, "total_tokens": 17218016} {"current_steps": 13595, "total_steps": 40000, "loss": 0.0554, "lr": 0.22232498555851513, "epoch": 0.6642562235848826, "percentage": 33.99, "elapsed_time": "14:14:34", "remaining_time": "1 day, 3:39:48", "throughput": 335.93, "total_tokens": 17224384} {"current_steps": 13600, "total_steps": 40000, "loss": 0.0507, "lr": 0.22227337463722546, "epoch": 0.664500525248577, "percentage": 34.0, "elapsed_time": "14:14:37", "remaining_time": "1 day, 3:38:58", "throughput": 336.02, "total_tokens": 17230496} {"current_steps": 13600, "total_steps": 40000, "eval_loss": 0.07045367360115051, "epoch": 0.664500525248577, "percentage": 34.0, "elapsed_time": "14:25:17", "remaining_time": "1 day, 3:59:41", "throughput": 331.88, "total_tokens": 17230496} {"current_steps": 13605, "total_steps": 40000, "loss": 0.0788, "lr": 0.2222217525704732, "epoch": 0.6647448269122713, "percentage": 34.01, "elapsed_time": "14:25:21", "remaining_time": "1 day, 3:58:52", "throughput": 331.98, "total_tokens": 17237024} {"current_steps": 13610, "total_steps": 40000, "loss": 0.0723, "lr": 0.22217011936621908, "epoch": 0.6649891285759656, "percentage": 34.02, "elapsed_time": "14:25:24", "remaining_time": "1 day, 3:58:02", "throughput": 332.09, "total_tokens": 17243520} {"current_steps": 13615, "total_steps": 40000, "loss": 0.0697, "lr": 0.22211847503242566, "epoch": 0.66523343023966, "percentage": 34.04, "elapsed_time": "14:25:27", "remaining_time": "1 day, 3:57:12", "throughput": 332.19, "total_tokens": 17249760} {"current_steps": 13620, "total_steps": 40000, "loss": 0.0463, "lr": 0.22206681957705704, "epoch": 0.6654777319033542, "percentage": 34.05, "elapsed_time": "14:25:30", "remaining_time": "1 day, 3:56:22", "throughput": 332.29, "total_tokens": 17256096} {"current_steps": 13625, "total_steps": 40000, "loss": 0.0796, "lr": 0.2220151530080792, "epoch": 0.6657220335670486, "percentage": 34.06, "elapsed_time": "14:25:33", "remaining_time": "1 day, 3:55:32", "throughput": 332.4, "total_tokens": 17263040} {"current_steps": 13630, "total_steps": 40000, "loss": 0.0513, "lr": 0.2219634753334598, "epoch": 0.6659663352307429, "percentage": 34.08, "elapsed_time": "14:25:36", "remaining_time": "1 day, 3:54:42", "throughput": 332.51, "total_tokens": 17269472} {"current_steps": 13635, "total_steps": 40000, "loss": 0.1029, "lr": 0.22191178656116817, "epoch": 0.6662106368944373, "percentage": 34.09, "elapsed_time": "14:25:40", "remaining_time": "1 day, 3:53:52", "throughput": 332.61, "total_tokens": 17275552} {"current_steps": 13640, "total_steps": 40000, "loss": 0.0479, "lr": 0.2218600866991753, "epoch": 0.6664549385581315, "percentage": 34.1, "elapsed_time": "14:25:43", "remaining_time": "1 day, 3:53:02", "throughput": 332.71, "total_tokens": 17281920} {"current_steps": 13645, "total_steps": 40000, "loss": 0.0558, "lr": 0.221808375755454, "epoch": 0.6666992402218259, "percentage": 34.11, "elapsed_time": "14:25:46", "remaining_time": "1 day, 3:52:12", "throughput": 332.81, "total_tokens": 17288032} {"current_steps": 13650, "total_steps": 40000, "loss": 0.0744, "lr": 0.22175665373797881, "epoch": 0.6669435418855202, "percentage": 34.12, "elapsed_time": "14:25:49", "remaining_time": "1 day, 3:51:22", "throughput": 332.91, "total_tokens": 17294304} {"current_steps": 13655, "total_steps": 40000, "loss": 0.0755, "lr": 0.22170492065472583, "epoch": 0.6671878435492146, "percentage": 34.14, "elapsed_time": "14:25:52", "remaining_time": "1 day, 3:50:33", "throughput": 333.01, "total_tokens": 17300704} {"current_steps": 13660, "total_steps": 40000, "loss": 0.0587, "lr": 0.221653176513673, "epoch": 0.667432145212909, "percentage": 34.15, "elapsed_time": "14:25:55", "remaining_time": "1 day, 3:49:43", "throughput": 333.12, "total_tokens": 17307200} {"current_steps": 13665, "total_steps": 40000, "loss": 0.0415, "lr": 0.2216014213227999, "epoch": 0.6676764468766032, "percentage": 34.16, "elapsed_time": "14:25:58", "remaining_time": "1 day, 3:48:53", "throughput": 333.22, "total_tokens": 17313376} {"current_steps": 13670, "total_steps": 40000, "loss": 0.0837, "lr": 0.22154965509008784, "epoch": 0.6679207485402976, "percentage": 34.17, "elapsed_time": "14:26:01", "remaining_time": "1 day, 3:48:04", "throughput": 333.31, "total_tokens": 17319456} {"current_steps": 13675, "total_steps": 40000, "loss": 0.0623, "lr": 0.2214978778235198, "epoch": 0.6681650502039919, "percentage": 34.19, "elapsed_time": "14:26:04", "remaining_time": "1 day, 3:47:14", "throughput": 333.41, "total_tokens": 17325792} {"current_steps": 13680, "total_steps": 40000, "loss": 0.0553, "lr": 0.2214460895310805, "epoch": 0.6684093518676862, "percentage": 34.2, "elapsed_time": "14:26:07", "remaining_time": "1 day, 3:46:24", "throughput": 333.52, "total_tokens": 17332320} {"current_steps": 13685, "total_steps": 40000, "loss": 0.0398, "lr": 0.22139429022075635, "epoch": 0.6686536535313805, "percentage": 34.21, "elapsed_time": "14:26:10", "remaining_time": "1 day, 3:45:35", "throughput": 333.62, "total_tokens": 17338688} {"current_steps": 13690, "total_steps": 40000, "loss": 0.0677, "lr": 0.22134247990053546, "epoch": 0.6688979551950749, "percentage": 34.23, "elapsed_time": "14:26:13", "remaining_time": "1 day, 3:44:45", "throughput": 333.72, "total_tokens": 17344768} {"current_steps": 13695, "total_steps": 40000, "loss": 0.0753, "lr": 0.2212906585784076, "epoch": 0.6691422568587692, "percentage": 34.24, "elapsed_time": "14:26:17", "remaining_time": "1 day, 3:43:56", "throughput": 333.82, "total_tokens": 17351008} {"current_steps": 13700, "total_steps": 40000, "loss": 0.0726, "lr": 0.22123882626236432, "epoch": 0.6693865585224635, "percentage": 34.25, "elapsed_time": "14:26:20", "remaining_time": "1 day, 3:43:06", "throughput": 333.92, "total_tokens": 17357024} {"current_steps": 13705, "total_steps": 40000, "loss": 0.0594, "lr": 0.2211869829603988, "epoch": 0.6696308601861579, "percentage": 34.26, "elapsed_time": "14:26:23", "remaining_time": "1 day, 3:42:17", "throughput": 334.02, "total_tokens": 17363360} {"current_steps": 13710, "total_steps": 40000, "loss": 0.0539, "lr": 0.22113512868050592, "epoch": 0.6698751618498522, "percentage": 34.27, "elapsed_time": "14:26:26", "remaining_time": "1 day, 3:41:27", "throughput": 334.12, "total_tokens": 17369696} {"current_steps": 13715, "total_steps": 40000, "loss": 0.0477, "lr": 0.2210832634306822, "epoch": 0.6701194635135466, "percentage": 34.29, "elapsed_time": "14:26:29", "remaining_time": "1 day, 3:40:38", "throughput": 334.23, "total_tokens": 17376544} {"current_steps": 13720, "total_steps": 40000, "loss": 0.0694, "lr": 0.22103138721892598, "epoch": 0.6703637651772408, "percentage": 34.3, "elapsed_time": "14:26:32", "remaining_time": "1 day, 3:39:49", "throughput": 334.34, "total_tokens": 17383136} {"current_steps": 13725, "total_steps": 40000, "loss": 0.0658, "lr": 0.22097950005323724, "epoch": 0.6706080668409352, "percentage": 34.31, "elapsed_time": "14:26:35", "remaining_time": "1 day, 3:38:59", "throughput": 334.45, "total_tokens": 17389760} {"current_steps": 13730, "total_steps": 40000, "loss": 0.0739, "lr": 0.22092760194161762, "epoch": 0.6708523685046295, "percentage": 34.33, "elapsed_time": "14:26:38", "remaining_time": "1 day, 3:38:10", "throughput": 334.55, "total_tokens": 17396064} {"current_steps": 13735, "total_steps": 40000, "loss": 0.0582, "lr": 0.2208756928920704, "epoch": 0.6710966701683239, "percentage": 34.34, "elapsed_time": "14:26:41", "remaining_time": "1 day, 3:37:21", "throughput": 334.65, "total_tokens": 17402592} {"current_steps": 13740, "total_steps": 40000, "loss": 0.0547, "lr": 0.22082377291260072, "epoch": 0.6713409718320181, "percentage": 34.35, "elapsed_time": "14:26:44", "remaining_time": "1 day, 3:36:32", "throughput": 334.76, "total_tokens": 17409152} {"current_steps": 13745, "total_steps": 40000, "loss": 0.0439, "lr": 0.2207718420112152, "epoch": 0.6715852734957125, "percentage": 34.36, "elapsed_time": "14:26:47", "remaining_time": "1 day, 3:35:42", "throughput": 334.86, "total_tokens": 17415168} {"current_steps": 13750, "total_steps": 40000, "loss": 0.0705, "lr": 0.22071990019592228, "epoch": 0.6718295751594069, "percentage": 34.38, "elapsed_time": "14:26:51", "remaining_time": "1 day, 3:34:53", "throughput": 334.96, "total_tokens": 17421696} {"current_steps": 13755, "total_steps": 40000, "loss": 0.0667, "lr": 0.22066794747473198, "epoch": 0.6720738768231012, "percentage": 34.39, "elapsed_time": "14:26:54", "remaining_time": "1 day, 3:34:04", "throughput": 335.07, "total_tokens": 17428416} {"current_steps": 13760, "total_steps": 40000, "loss": 0.095, "lr": 0.2206159838556562, "epoch": 0.6723181784867955, "percentage": 34.4, "elapsed_time": "14:26:57", "remaining_time": "1 day, 3:33:15", "throughput": 335.17, "total_tokens": 17434848} {"current_steps": 13765, "total_steps": 40000, "loss": 0.0636, "lr": 0.2205640093467082, "epoch": 0.6725624801504898, "percentage": 34.41, "elapsed_time": "14:27:00", "remaining_time": "1 day, 3:32:26", "throughput": 335.28, "total_tokens": 17441344} {"current_steps": 13770, "total_steps": 40000, "loss": 0.039, "lr": 0.22051202395590322, "epoch": 0.6728067818141842, "percentage": 34.42, "elapsed_time": "14:27:03", "remaining_time": "1 day, 3:31:37", "throughput": 335.38, "total_tokens": 17447808} {"current_steps": 13775, "total_steps": 40000, "loss": 0.0633, "lr": 0.22046002769125808, "epoch": 0.6730510834778785, "percentage": 34.44, "elapsed_time": "14:27:06", "remaining_time": "1 day, 3:30:48", "throughput": 335.48, "total_tokens": 17453856} {"current_steps": 13780, "total_steps": 40000, "loss": 0.0772, "lr": 0.2204080205607912, "epoch": 0.6732953851415728, "percentage": 34.45, "elapsed_time": "14:27:09", "remaining_time": "1 day, 3:29:59", "throughput": 335.58, "total_tokens": 17460320} {"current_steps": 13785, "total_steps": 40000, "loss": 0.1, "lr": 0.22035600257252272, "epoch": 0.6735396868052671, "percentage": 34.46, "elapsed_time": "14:27:12", "remaining_time": "1 day, 3:29:10", "throughput": 335.69, "total_tokens": 17466688} {"current_steps": 13790, "total_steps": 40000, "loss": 0.0865, "lr": 0.2203039737344745, "epoch": 0.6737839884689615, "percentage": 34.48, "elapsed_time": "14:27:15", "remaining_time": "1 day, 3:28:21", "throughput": 335.79, "total_tokens": 17472896} {"current_steps": 13795, "total_steps": 40000, "loss": 0.0973, "lr": 0.22025193405467003, "epoch": 0.6740282901326557, "percentage": 34.49, "elapsed_time": "14:27:18", "remaining_time": "1 day, 3:27:32", "throughput": 335.89, "total_tokens": 17479200} {"current_steps": 13800, "total_steps": 40000, "loss": 0.049, "lr": 0.2201998835411345, "epoch": 0.6742725917963501, "percentage": 34.5, "elapsed_time": "14:27:21", "remaining_time": "1 day, 3:26:43", "throughput": 335.98, "total_tokens": 17485120} {"current_steps": 13800, "total_steps": 40000, "eval_loss": 0.06976202875375748, "epoch": 0.6742725917963501, "percentage": 34.5, "elapsed_time": "14:38:01", "remaining_time": "1 day, 3:46:59", "throughput": 331.9, "total_tokens": 17485120} {"current_steps": 13805, "total_steps": 40000, "loss": 0.09, "lr": 0.22014782220189474, "epoch": 0.6745168934600445, "percentage": 34.51, "elapsed_time": "14:38:05", "remaining_time": "1 day, 3:46:11", "throughput": 332.0, "total_tokens": 17491776} {"current_steps": 13810, "total_steps": 40000, "loss": 0.0593, "lr": 0.2200957500449793, "epoch": 0.6747611951237388, "percentage": 34.52, "elapsed_time": "14:38:08", "remaining_time": "1 day, 3:45:21", "throughput": 332.1, "total_tokens": 17497920} {"current_steps": 13815, "total_steps": 40000, "loss": 0.0514, "lr": 0.22004366707841827, "epoch": 0.6750054967874332, "percentage": 34.54, "elapsed_time": "14:38:11", "remaining_time": "1 day, 3:44:32", "throughput": 332.2, "total_tokens": 17504160} {"current_steps": 13820, "total_steps": 40000, "loss": 0.0653, "lr": 0.21999157331024358, "epoch": 0.6752497984511274, "percentage": 34.55, "elapsed_time": "14:38:15", "remaining_time": "1 day, 3:43:43", "throughput": 332.3, "total_tokens": 17510784} {"current_steps": 13825, "total_steps": 40000, "loss": 0.067, "lr": 0.21993946874848871, "epoch": 0.6754941001148218, "percentage": 34.56, "elapsed_time": "14:38:18", "remaining_time": "1 day, 3:42:53", "throughput": 332.4, "total_tokens": 17517056} {"current_steps": 13830, "total_steps": 40000, "loss": 0.0806, "lr": 0.2198873534011888, "epoch": 0.6757384017785161, "percentage": 34.58, "elapsed_time": "14:38:21", "remaining_time": "1 day, 3:42:04", "throughput": 332.5, "total_tokens": 17523168} {"current_steps": 13835, "total_steps": 40000, "loss": 0.0428, "lr": 0.2198352272763808, "epoch": 0.6759827034422105, "percentage": 34.59, "elapsed_time": "14:38:24", "remaining_time": "1 day, 3:41:15", "throughput": 332.6, "total_tokens": 17529504} {"current_steps": 13840, "total_steps": 40000, "loss": 0.0587, "lr": 0.2197830903821031, "epoch": 0.6762270051059047, "percentage": 34.6, "elapsed_time": "14:38:27", "remaining_time": "1 day, 3:40:26", "throughput": 332.71, "total_tokens": 17536288} {"current_steps": 13845, "total_steps": 40000, "loss": 0.0667, "lr": 0.21973094272639598, "epoch": 0.6764713067695991, "percentage": 34.61, "elapsed_time": "14:38:30", "remaining_time": "1 day, 3:39:36", "throughput": 332.8, "total_tokens": 17542240} {"current_steps": 13850, "total_steps": 40000, "loss": 0.0719, "lr": 0.21967878431730117, "epoch": 0.6767156084332935, "percentage": 34.62, "elapsed_time": "14:38:33", "remaining_time": "1 day, 3:38:47", "throughput": 332.91, "total_tokens": 17548640} {"current_steps": 13855, "total_steps": 40000, "loss": 0.0728, "lr": 0.21962661516286217, "epoch": 0.6769599100969877, "percentage": 34.64, "elapsed_time": "14:38:36", "remaining_time": "1 day, 3:37:59", "throughput": 333.02, "total_tokens": 17555552} {"current_steps": 13860, "total_steps": 40000, "loss": 0.0584, "lr": 0.21957443527112414, "epoch": 0.6772042117606821, "percentage": 34.65, "elapsed_time": "14:38:40", "remaining_time": "1 day, 3:37:10", "throughput": 333.12, "total_tokens": 17562176} {"current_steps": 13865, "total_steps": 40000, "loss": 0.0859, "lr": 0.21952224465013384, "epoch": 0.6774485134243764, "percentage": 34.66, "elapsed_time": "14:38:43", "remaining_time": "1 day, 3:36:21", "throughput": 333.22, "total_tokens": 17568416} {"current_steps": 13870, "total_steps": 40000, "loss": 0.0416, "lr": 0.21947004330793976, "epoch": 0.6776928150880708, "percentage": 34.67, "elapsed_time": "14:38:46", "remaining_time": "1 day, 3:35:32", "throughput": 333.33, "total_tokens": 17575136} {"current_steps": 13875, "total_steps": 40000, "loss": 0.0551, "lr": 0.21941783125259198, "epoch": 0.677937116751765, "percentage": 34.69, "elapsed_time": "14:38:49", "remaining_time": "1 day, 3:34:43", "throughput": 333.43, "total_tokens": 17581408} {"current_steps": 13880, "total_steps": 40000, "loss": 0.1302, "lr": 0.21936560849214226, "epoch": 0.6781814184154594, "percentage": 34.7, "elapsed_time": "14:38:52", "remaining_time": "1 day, 3:33:54", "throughput": 333.53, "total_tokens": 17587904} {"current_steps": 13885, "total_steps": 40000, "loss": 0.0778, "lr": 0.21931337503464404, "epoch": 0.6784257200791537, "percentage": 34.71, "elapsed_time": "14:38:55", "remaining_time": "1 day, 3:33:05", "throughput": 333.63, "total_tokens": 17594432} {"current_steps": 13890, "total_steps": 40000, "loss": 0.0744, "lr": 0.21926113088815233, "epoch": 0.6786700217428481, "percentage": 34.73, "elapsed_time": "14:38:58", "remaining_time": "1 day, 3:32:16", "throughput": 333.74, "total_tokens": 17600800} {"current_steps": 13895, "total_steps": 40000, "loss": 0.0662, "lr": 0.2192088760607238, "epoch": 0.6789143234065425, "percentage": 34.74, "elapsed_time": "14:39:01", "remaining_time": "1 day, 3:31:27", "throughput": 333.84, "total_tokens": 17607552} {"current_steps": 13900, "total_steps": 40000, "loss": 0.0505, "lr": 0.2191566105604169, "epoch": 0.6791586250702367, "percentage": 34.75, "elapsed_time": "14:39:04", "remaining_time": "1 day, 3:30:39", "throughput": 333.94, "total_tokens": 17613728} {"current_steps": 13905, "total_steps": 40000, "loss": 0.1008, "lr": 0.21910433439529153, "epoch": 0.6794029267339311, "percentage": 34.76, "elapsed_time": "14:39:08", "remaining_time": "1 day, 3:29:50", "throughput": 334.04, "total_tokens": 17620000} {"current_steps": 13910, "total_steps": 40000, "loss": 0.0485, "lr": 0.2190520475734094, "epoch": 0.6796472283976254, "percentage": 34.77, "elapsed_time": "14:39:11", "remaining_time": "1 day, 3:29:01", "throughput": 334.15, "total_tokens": 17626848} {"current_steps": 13915, "total_steps": 40000, "loss": 0.0488, "lr": 0.2189997501028338, "epoch": 0.6798915300613197, "percentage": 34.79, "elapsed_time": "14:39:14", "remaining_time": "1 day, 3:28:13", "throughput": 334.25, "total_tokens": 17633056} {"current_steps": 13920, "total_steps": 40000, "loss": 0.091, "lr": 0.2189474419916296, "epoch": 0.680135831725014, "percentage": 34.8, "elapsed_time": "14:39:17", "remaining_time": "1 day, 3:27:24", "throughput": 334.34, "total_tokens": 17639072} {"current_steps": 13925, "total_steps": 40000, "loss": 0.0586, "lr": 0.21889512324786342, "epoch": 0.6803801333887084, "percentage": 34.81, "elapsed_time": "14:39:20", "remaining_time": "1 day, 3:26:35", "throughput": 334.45, "total_tokens": 17645600} {"current_steps": 13930, "total_steps": 40000, "loss": 0.099, "lr": 0.21884279387960345, "epoch": 0.6806244350524027, "percentage": 34.83, "elapsed_time": "14:39:23", "remaining_time": "1 day, 3:25:47", "throughput": 334.55, "total_tokens": 17652128} {"current_steps": 13935, "total_steps": 40000, "loss": 0.053, "lr": 0.2187904538949195, "epoch": 0.680868736716097, "percentage": 34.84, "elapsed_time": "14:39:26", "remaining_time": "1 day, 3:24:58", "throughput": 334.65, "total_tokens": 17658368} {"current_steps": 13940, "total_steps": 40000, "loss": 0.0861, "lr": 0.2187381033018831, "epoch": 0.6811130383797913, "percentage": 34.85, "elapsed_time": "14:39:29", "remaining_time": "1 day, 3:24:09", "throughput": 334.75, "total_tokens": 17664480} {"current_steps": 13945, "total_steps": 40000, "loss": 0.0907, "lr": 0.2186857421085673, "epoch": 0.6813573400434857, "percentage": 34.86, "elapsed_time": "14:39:32", "remaining_time": "1 day, 3:23:21", "throughput": 334.84, "total_tokens": 17670592} {"current_steps": 13950, "total_steps": 40000, "loss": 0.1106, "lr": 0.21863337032304697, "epoch": 0.6816016417071801, "percentage": 34.88, "elapsed_time": "14:39:35", "remaining_time": "1 day, 3:22:32", "throughput": 334.94, "total_tokens": 17676672} {"current_steps": 13955, "total_steps": 40000, "loss": 0.0894, "lr": 0.21858098795339845, "epoch": 0.6818459433708743, "percentage": 34.89, "elapsed_time": "14:39:38", "remaining_time": "1 day, 3:21:44", "throughput": 335.03, "total_tokens": 17682720} {"current_steps": 13960, "total_steps": 40000, "loss": 0.062, "lr": 0.21852859500769975, "epoch": 0.6820902450345687, "percentage": 34.9, "elapsed_time": "14:39:42", "remaining_time": "1 day, 3:20:55", "throughput": 335.14, "total_tokens": 17689120} {"current_steps": 13965, "total_steps": 40000, "loss": 0.0744, "lr": 0.21847619149403044, "epoch": 0.682334546698263, "percentage": 34.91, "elapsed_time": "14:39:45", "remaining_time": "1 day, 3:20:07", "throughput": 335.25, "total_tokens": 17696096} {"current_steps": 13970, "total_steps": 40000, "loss": 0.0678, "lr": 0.21842377742047195, "epoch": 0.6825788483619574, "percentage": 34.92, "elapsed_time": "14:39:48", "remaining_time": "1 day, 3:19:19", "throughput": 335.35, "total_tokens": 17702688} {"current_steps": 13975, "total_steps": 40000, "loss": 0.0666, "lr": 0.21837135279510705, "epoch": 0.6828231500256516, "percentage": 34.94, "elapsed_time": "14:39:51", "remaining_time": "1 day, 3:18:31", "throughput": 335.45, "total_tokens": 17708928} {"current_steps": 13980, "total_steps": 40000, "loss": 0.1021, "lr": 0.21831891762602038, "epoch": 0.683067451689346, "percentage": 34.95, "elapsed_time": "14:39:54", "remaining_time": "1 day, 3:17:42", "throughput": 335.55, "total_tokens": 17715488} {"current_steps": 13985, "total_steps": 40000, "loss": 0.1055, "lr": 0.21826647192129806, "epoch": 0.6833117533530403, "percentage": 34.96, "elapsed_time": "14:39:57", "remaining_time": "1 day, 3:16:54", "throughput": 335.65, "total_tokens": 17721376} {"current_steps": 13990, "total_steps": 40000, "loss": 0.0841, "lr": 0.21821401568902787, "epoch": 0.6835560550167347, "percentage": 34.98, "elapsed_time": "14:40:00", "remaining_time": "1 day, 3:16:06", "throughput": 335.75, "total_tokens": 17727616} {"current_steps": 13995, "total_steps": 40000, "loss": 0.0552, "lr": 0.21816154893729925, "epoch": 0.683800356680429, "percentage": 34.99, "elapsed_time": "14:40:03", "remaining_time": "1 day, 3:15:18", "throughput": 335.84, "total_tokens": 17733632} {"current_steps": 14000, "total_steps": 40000, "loss": 0.0616, "lr": 0.2181090716742032, "epoch": 0.6840446583441233, "percentage": 35.0, "elapsed_time": "14:40:06", "remaining_time": "1 day, 3:14:29", "throughput": 335.94, "total_tokens": 17739872} {"current_steps": 14000, "total_steps": 40000, "eval_loss": 0.07680020481348038, "epoch": 0.6840446583441233, "percentage": 35.0, "elapsed_time": "14:50:47", "remaining_time": "1 day, 3:34:18", "throughput": 331.91, "total_tokens": 17739872} {"current_steps": 14005, "total_steps": 40000, "loss": 0.101, "lr": 0.21805658390783236, "epoch": 0.6842889600078177, "percentage": 35.01, "elapsed_time": "14:50:51", "remaining_time": "1 day, 3:33:31", "throughput": 332.0, "total_tokens": 17745984} {"current_steps": 14010, "total_steps": 40000, "loss": 0.0558, "lr": 0.21800408564628107, "epoch": 0.684533261671512, "percentage": 35.02, "elapsed_time": "14:50:54", "remaining_time": "1 day, 3:32:43", "throughput": 332.11, "total_tokens": 17752800} {"current_steps": 14015, "total_steps": 40000, "loss": 0.0631, "lr": 0.21795157689764516, "epoch": 0.6847775633352063, "percentage": 35.04, "elapsed_time": "14:50:57", "remaining_time": "1 day, 3:31:54", "throughput": 332.21, "total_tokens": 17758976} {"current_steps": 14020, "total_steps": 40000, "loss": 0.0795, "lr": 0.21789905767002216, "epoch": 0.6850218649989006, "percentage": 35.05, "elapsed_time": "14:51:00", "remaining_time": "1 day, 3:31:05", "throughput": 332.31, "total_tokens": 17765600} {"current_steps": 14025, "total_steps": 40000, "loss": 0.0379, "lr": 0.2178465279715112, "epoch": 0.685266166662595, "percentage": 35.06, "elapsed_time": "14:51:03", "remaining_time": "1 day, 3:30:17", "throughput": 332.41, "total_tokens": 17772032} {"current_steps": 14030, "total_steps": 40000, "loss": 0.1025, "lr": 0.21779398781021303, "epoch": 0.6855104683262893, "percentage": 35.08, "elapsed_time": "14:51:06", "remaining_time": "1 day, 3:29:28", "throughput": 332.51, "total_tokens": 17778208} {"current_steps": 14035, "total_steps": 40000, "loss": 0.108, "lr": 0.21774143719422998, "epoch": 0.6857547699899836, "percentage": 35.09, "elapsed_time": "14:51:09", "remaining_time": "1 day, 3:28:39", "throughput": 332.61, "total_tokens": 17784384} {"current_steps": 14040, "total_steps": 40000, "loss": 0.049, "lr": 0.21768887613166601, "epoch": 0.685999071653678, "percentage": 35.1, "elapsed_time": "14:51:12", "remaining_time": "1 day, 3:27:51", "throughput": 332.7, "total_tokens": 17790432} {"current_steps": 14045, "total_steps": 40000, "loss": 0.0687, "lr": 0.2176363046306267, "epoch": 0.6862433733173723, "percentage": 35.11, "elapsed_time": "14:51:15", "remaining_time": "1 day, 3:27:02", "throughput": 332.81, "total_tokens": 17797312} {"current_steps": 14050, "total_steps": 40000, "loss": 0.0678, "lr": 0.21758372269921925, "epoch": 0.6864876749810667, "percentage": 35.12, "elapsed_time": "14:51:18", "remaining_time": "1 day, 3:26:14", "throughput": 332.9, "total_tokens": 17803392} {"current_steps": 14055, "total_steps": 40000, "loss": 0.0861, "lr": 0.21753113034555244, "epoch": 0.6867319766447609, "percentage": 35.14, "elapsed_time": "14:51:22", "remaining_time": "1 day, 3:25:25", "throughput": 333.01, "total_tokens": 17810048} {"current_steps": 14060, "total_steps": 40000, "loss": 0.0648, "lr": 0.2174785275777367, "epoch": 0.6869762783084553, "percentage": 35.15, "elapsed_time": "14:51:25", "remaining_time": "1 day, 3:24:37", "throughput": 333.1, "total_tokens": 17816064} {"current_steps": 14065, "total_steps": 40000, "loss": 0.0636, "lr": 0.21742591440388404, "epoch": 0.6872205799721496, "percentage": 35.16, "elapsed_time": "14:51:28", "remaining_time": "1 day, 3:23:49", "throughput": 333.2, "total_tokens": 17822496} {"current_steps": 14070, "total_steps": 40000, "loss": 0.071, "lr": 0.21737329083210802, "epoch": 0.687464881635844, "percentage": 35.17, "elapsed_time": "14:51:31", "remaining_time": "1 day, 3:23:00", "throughput": 333.3, "total_tokens": 17828672} {"current_steps": 14075, "total_steps": 40000, "loss": 0.064, "lr": 0.2173206568705239, "epoch": 0.6877091832995382, "percentage": 35.19, "elapsed_time": "14:51:34", "remaining_time": "1 day, 3:22:12", "throughput": 333.41, "total_tokens": 17835712} {"current_steps": 14080, "total_steps": 40000, "loss": 0.0885, "lr": 0.2172680125272485, "epoch": 0.6879534849632326, "percentage": 35.2, "elapsed_time": "14:51:37", "remaining_time": "1 day, 3:21:24", "throughput": 333.5, "total_tokens": 17841408} {"current_steps": 14085, "total_steps": 40000, "loss": 0.0752, "lr": 0.2172153578104002, "epoch": 0.6881977866269269, "percentage": 35.21, "elapsed_time": "14:51:40", "remaining_time": "1 day, 3:20:35", "throughput": 333.6, "total_tokens": 17847968} {"current_steps": 14090, "total_steps": 40000, "loss": 0.0648, "lr": 0.21716269272809902, "epoch": 0.6884420882906213, "percentage": 35.23, "elapsed_time": "14:51:43", "remaining_time": "1 day, 3:19:47", "throughput": 333.7, "total_tokens": 17854336} {"current_steps": 14095, "total_steps": 40000, "loss": 0.0861, "lr": 0.21711001728846666, "epoch": 0.6886863899543156, "percentage": 35.24, "elapsed_time": "14:51:46", "remaining_time": "1 day, 3:18:59", "throughput": 333.8, "total_tokens": 17860736} {"current_steps": 14100, "total_steps": 40000, "loss": 0.0614, "lr": 0.21705733149962628, "epoch": 0.6889306916180099, "percentage": 35.25, "elapsed_time": "14:51:49", "remaining_time": "1 day, 3:18:10", "throughput": 333.9, "total_tokens": 17866752} {"current_steps": 14105, "total_steps": 40000, "loss": 0.0618, "lr": 0.21700463536970263, "epoch": 0.6891749932817043, "percentage": 35.26, "elapsed_time": "14:51:52", "remaining_time": "1 day, 3:17:22", "throughput": 334.0, "total_tokens": 17873280} {"current_steps": 14110, "total_steps": 40000, "loss": 0.0553, "lr": 0.21695192890682222, "epoch": 0.6894192949453986, "percentage": 35.27, "elapsed_time": "14:51:56", "remaining_time": "1 day, 3:16:34", "throughput": 334.1, "total_tokens": 17879616} {"current_steps": 14115, "total_steps": 40000, "loss": 0.0696, "lr": 0.21689921211911298, "epoch": 0.6896635966090929, "percentage": 35.29, "elapsed_time": "14:51:59", "remaining_time": "1 day, 3:15:46", "throughput": 334.2, "total_tokens": 17886368} {"current_steps": 14120, "total_steps": 40000, "loss": 0.0806, "lr": 0.21684648501470452, "epoch": 0.6899078982727872, "percentage": 35.3, "elapsed_time": "14:52:02", "remaining_time": "1 day, 3:14:58", "throughput": 334.3, "total_tokens": 17892448} {"current_steps": 14125, "total_steps": 40000, "loss": 0.0603, "lr": 0.216793747601728, "epoch": 0.6901521999364816, "percentage": 35.31, "elapsed_time": "14:52:05", "remaining_time": "1 day, 3:14:10", "throughput": 334.4, "total_tokens": 17898816} {"current_steps": 14130, "total_steps": 40000, "loss": 0.0502, "lr": 0.21674099988831627, "epoch": 0.6903965016001758, "percentage": 35.33, "elapsed_time": "14:52:08", "remaining_time": "1 day, 3:13:22", "throughput": 334.5, "total_tokens": 17905248} {"current_steps": 14135, "total_steps": 40000, "loss": 0.0424, "lr": 0.21668824188260363, "epoch": 0.6906408032638702, "percentage": 35.34, "elapsed_time": "14:52:11", "remaining_time": "1 day, 3:12:35", "throughput": 334.61, "total_tokens": 17912224} {"current_steps": 14140, "total_steps": 40000, "loss": 0.0677, "lr": 0.21663547359272606, "epoch": 0.6908851049275646, "percentage": 35.35, "elapsed_time": "14:52:14", "remaining_time": "1 day, 3:11:47", "throughput": 334.71, "total_tokens": 17918432} {"current_steps": 14145, "total_steps": 40000, "loss": 0.0383, "lr": 0.216582695026821, "epoch": 0.6911294065912589, "percentage": 35.36, "elapsed_time": "14:52:17", "remaining_time": "1 day, 3:10:59", "throughput": 334.81, "total_tokens": 17925280} {"current_steps": 14150, "total_steps": 40000, "loss": 0.0624, "lr": 0.21652990619302767, "epoch": 0.6913737082549533, "percentage": 35.38, "elapsed_time": "14:52:20", "remaining_time": "1 day, 3:10:11", "throughput": 334.92, "total_tokens": 17931712} {"current_steps": 14155, "total_steps": 40000, "loss": 0.0621, "lr": 0.21647710709948673, "epoch": 0.6916180099186475, "percentage": 35.39, "elapsed_time": "14:52:23", "remaining_time": "1 day, 3:09:23", "throughput": 335.01, "total_tokens": 17937792} {"current_steps": 14160, "total_steps": 40000, "loss": 0.0556, "lr": 0.2164242977543405, "epoch": 0.6918623115823419, "percentage": 35.4, "elapsed_time": "14:52:27", "remaining_time": "1 day, 3:08:35", "throughput": 335.11, "total_tokens": 17944032} {"current_steps": 14165, "total_steps": 40000, "loss": 0.0726, "lr": 0.21637147816573277, "epoch": 0.6921066132460362, "percentage": 35.41, "elapsed_time": "14:52:30", "remaining_time": "1 day, 3:07:47", "throughput": 335.2, "total_tokens": 17950144} {"current_steps": 14170, "total_steps": 40000, "loss": 0.04, "lr": 0.21631864834180908, "epoch": 0.6923509149097306, "percentage": 35.43, "elapsed_time": "14:52:33", "remaining_time": "1 day, 3:07:00", "throughput": 335.3, "total_tokens": 17956640} {"current_steps": 14175, "total_steps": 40000, "loss": 0.0558, "lr": 0.21626580829071637, "epoch": 0.6925952165734248, "percentage": 35.44, "elapsed_time": "14:52:36", "remaining_time": "1 day, 3:06:12", "throughput": 335.41, "total_tokens": 17963200} {"current_steps": 14180, "total_steps": 40000, "loss": 0.0636, "lr": 0.21621295802060328, "epoch": 0.6928395182371192, "percentage": 35.45, "elapsed_time": "14:52:39", "remaining_time": "1 day, 3:05:24", "throughput": 335.51, "total_tokens": 17969504} {"current_steps": 14185, "total_steps": 40000, "loss": 0.0627, "lr": 0.21616009753961996, "epoch": 0.6930838199008135, "percentage": 35.46, "elapsed_time": "14:52:42", "remaining_time": "1 day, 3:04:37", "throughput": 335.61, "total_tokens": 17975840} {"current_steps": 14190, "total_steps": 40000, "loss": 0.0661, "lr": 0.2161072268559182, "epoch": 0.6933281215645078, "percentage": 35.48, "elapsed_time": "14:52:45", "remaining_time": "1 day, 3:03:49", "throughput": 335.7, "total_tokens": 17981856} {"current_steps": 14195, "total_steps": 40000, "loss": 0.0952, "lr": 0.21605434597765133, "epoch": 0.6935724232282022, "percentage": 35.49, "elapsed_time": "14:52:48", "remaining_time": "1 day, 3:03:01", "throughput": 335.79, "total_tokens": 17987712} {"current_steps": 14200, "total_steps": 40000, "loss": 0.0931, "lr": 0.21600145491297418, "epoch": 0.6938167248918965, "percentage": 35.5, "elapsed_time": "14:52:51", "remaining_time": "1 day, 3:02:13", "throughput": 335.89, "total_tokens": 17994144} {"current_steps": 14200, "total_steps": 40000, "eval_loss": 0.06763430684804916, "epoch": 0.6938167248918965, "percentage": 35.5, "elapsed_time": "15:03:31", "remaining_time": "1 day, 3:21:37", "throughput": 331.92, "total_tokens": 17994144} {"current_steps": 14205, "total_steps": 40000, "loss": 0.0797, "lr": 0.21594855367004326, "epoch": 0.6940610265555909, "percentage": 35.51, "elapsed_time": "15:03:35", "remaining_time": "1 day, 3:20:50", "throughput": 332.02, "total_tokens": 18000416} {"current_steps": 14210, "total_steps": 40000, "loss": 0.0633, "lr": 0.21589564225701663, "epoch": 0.6943053282192851, "percentage": 35.52, "elapsed_time": "15:03:38", "remaining_time": "1 day, 3:20:01", "throughput": 332.11, "total_tokens": 18006560} {"current_steps": 14215, "total_steps": 40000, "loss": 0.0652, "lr": 0.21584272068205385, "epoch": 0.6945496298829795, "percentage": 35.54, "elapsed_time": "15:03:41", "remaining_time": "1 day, 3:19:13", "throughput": 332.2, "total_tokens": 18012384} {"current_steps": 14220, "total_steps": 40000, "loss": 0.0787, "lr": 0.2157897889533161, "epoch": 0.6947939315466738, "percentage": 35.55, "elapsed_time": "15:03:44", "remaining_time": "1 day, 3:18:25", "throughput": 332.3, "total_tokens": 18018720} {"current_steps": 14225, "total_steps": 40000, "loss": 0.081, "lr": 0.21573684707896612, "epoch": 0.6950382332103682, "percentage": 35.56, "elapsed_time": "15:03:47", "remaining_time": "1 day, 3:17:37", "throughput": 332.39, "total_tokens": 18024544} {"current_steps": 14230, "total_steps": 40000, "loss": 0.059, "lr": 0.21568389506716826, "epoch": 0.6952825348740624, "percentage": 35.58, "elapsed_time": "15:03:50", "remaining_time": "1 day, 3:16:49", "throughput": 332.48, "total_tokens": 18030560} {"current_steps": 14235, "total_steps": 40000, "loss": 0.0498, "lr": 0.21563093292608831, "epoch": 0.6955268365377568, "percentage": 35.59, "elapsed_time": "15:03:53", "remaining_time": "1 day, 3:16:01", "throughput": 332.58, "total_tokens": 18037216} {"current_steps": 14240, "total_steps": 40000, "loss": 0.0758, "lr": 0.21557796066389376, "epoch": 0.6957711382014512, "percentage": 35.6, "elapsed_time": "15:03:56", "remaining_time": "1 day, 3:15:13", "throughput": 332.68, "total_tokens": 18043680} {"current_steps": 14245, "total_steps": 40000, "loss": 0.0736, "lr": 0.21552497828875353, "epoch": 0.6960154398651455, "percentage": 35.61, "elapsed_time": "15:03:59", "remaining_time": "1 day, 3:14:25", "throughput": 332.78, "total_tokens": 18049920} {"current_steps": 14250, "total_steps": 40000, "loss": 0.0864, "lr": 0.21547198580883828, "epoch": 0.6962597415288398, "percentage": 35.62, "elapsed_time": "15:04:02", "remaining_time": "1 day, 3:13:37", "throughput": 332.89, "total_tokens": 18056768} {"current_steps": 14255, "total_steps": 40000, "loss": 0.0716, "lr": 0.21541898323232, "epoch": 0.6965040431925341, "percentage": 35.64, "elapsed_time": "15:04:06", "remaining_time": "1 day, 3:12:50", "throughput": 332.99, "total_tokens": 18063296} {"current_steps": 14260, "total_steps": 40000, "loss": 0.0451, "lr": 0.2153659705673724, "epoch": 0.6967483448562285, "percentage": 35.65, "elapsed_time": "15:04:09", "remaining_time": "1 day, 3:12:02", "throughput": 333.09, "total_tokens": 18069632} {"current_steps": 14265, "total_steps": 40000, "loss": 0.0776, "lr": 0.2153129478221707, "epoch": 0.6969926465199228, "percentage": 35.66, "elapsed_time": "15:04:12", "remaining_time": "1 day, 3:11:14", "throughput": 333.19, "total_tokens": 18076416} {"current_steps": 14270, "total_steps": 40000, "loss": 0.0509, "lr": 0.21525991500489164, "epoch": 0.6972369481836171, "percentage": 35.68, "elapsed_time": "15:04:15", "remaining_time": "1 day, 3:10:26", "throughput": 333.29, "total_tokens": 18082784} {"current_steps": 14275, "total_steps": 40000, "loss": 0.0539, "lr": 0.21520687212371362, "epoch": 0.6974812498473114, "percentage": 35.69, "elapsed_time": "15:04:18", "remaining_time": "1 day, 3:09:39", "throughput": 333.38, "total_tokens": 18088896} {"current_steps": 14280, "total_steps": 40000, "loss": 0.0682, "lr": 0.21515381918681648, "epoch": 0.6977255515110058, "percentage": 35.7, "elapsed_time": "15:04:21", "remaining_time": "1 day, 3:08:51", "throughput": 333.49, "total_tokens": 18095424} {"current_steps": 14285, "total_steps": 40000, "loss": 0.058, "lr": 0.21510075620238167, "epoch": 0.6979698531747002, "percentage": 35.71, "elapsed_time": "15:04:24", "remaining_time": "1 day, 3:08:03", "throughput": 333.58, "total_tokens": 18101536} {"current_steps": 14290, "total_steps": 40000, "loss": 0.0817, "lr": 0.21504768317859208, "epoch": 0.6982141548383944, "percentage": 35.73, "elapsed_time": "15:04:27", "remaining_time": "1 day, 3:07:16", "throughput": 333.68, "total_tokens": 18108000} {"current_steps": 14295, "total_steps": 40000, "loss": 0.0632, "lr": 0.2149946001236323, "epoch": 0.6984584565020888, "percentage": 35.74, "elapsed_time": "15:04:30", "remaining_time": "1 day, 3:06:28", "throughput": 333.78, "total_tokens": 18114432} {"current_steps": 14300, "total_steps": 40000, "loss": 0.0502, "lr": 0.21494150704568848, "epoch": 0.6987027581657831, "percentage": 35.75, "elapsed_time": "15:04:33", "remaining_time": "1 day, 3:05:41", "throughput": 333.88, "total_tokens": 18120992} {"current_steps": 14305, "total_steps": 40000, "loss": 0.0699, "lr": 0.21488840395294811, "epoch": 0.6989470598294775, "percentage": 35.76, "elapsed_time": "15:04:36", "remaining_time": "1 day, 3:04:53", "throughput": 333.98, "total_tokens": 18127488} {"current_steps": 14310, "total_steps": 40000, "loss": 0.0467, "lr": 0.21483529085360042, "epoch": 0.6991913614931717, "percentage": 35.77, "elapsed_time": "15:04:40", "remaining_time": "1 day, 3:04:06", "throughput": 334.1, "total_tokens": 18135136} {"current_steps": 14315, "total_steps": 40000, "loss": 0.0631, "lr": 0.2147821677558361, "epoch": 0.6994356631568661, "percentage": 35.79, "elapsed_time": "15:04:43", "remaining_time": "1 day, 3:03:19", "throughput": 334.21, "total_tokens": 18141984} {"current_steps": 14320, "total_steps": 40000, "loss": 0.062, "lr": 0.2147290346678475, "epoch": 0.6996799648205604, "percentage": 35.8, "elapsed_time": "15:04:46", "remaining_time": "1 day, 3:02:31", "throughput": 334.3, "total_tokens": 18147776} {"current_steps": 14325, "total_steps": 40000, "loss": 0.1104, "lr": 0.21467589159782827, "epoch": 0.6999242664842548, "percentage": 35.81, "elapsed_time": "15:04:49", "remaining_time": "1 day, 3:01:43", "throughput": 334.39, "total_tokens": 18153728} {"current_steps": 14330, "total_steps": 40000, "loss": 0.0537, "lr": 0.21462273855397374, "epoch": 0.700168568147949, "percentage": 35.83, "elapsed_time": "15:04:52", "remaining_time": "1 day, 3:00:56", "throughput": 334.48, "total_tokens": 18159872} {"current_steps": 14335, "total_steps": 40000, "loss": 0.0839, "lr": 0.21456957554448083, "epoch": 0.7004128698116434, "percentage": 35.84, "elapsed_time": "15:04:55", "remaining_time": "1 day, 3:00:09", "throughput": 334.58, "total_tokens": 18166144} {"current_steps": 14340, "total_steps": 40000, "loss": 0.0413, "lr": 0.21451640257754795, "epoch": 0.7006571714753378, "percentage": 35.85, "elapsed_time": "15:04:58", "remaining_time": "1 day, 2:59:21", "throughput": 334.68, "total_tokens": 18172480} {"current_steps": 14345, "total_steps": 40000, "loss": 0.0744, "lr": 0.21446321966137508, "epoch": 0.7009014731390321, "percentage": 35.86, "elapsed_time": "15:05:01", "remaining_time": "1 day, 2:58:34", "throughput": 334.78, "total_tokens": 18178880} {"current_steps": 14350, "total_steps": 40000, "loss": 0.068, "lr": 0.21441002680416354, "epoch": 0.7011457748027264, "percentage": 35.88, "elapsed_time": "15:05:04", "remaining_time": "1 day, 2:57:47", "throughput": 334.88, "total_tokens": 18185664} {"current_steps": 14355, "total_steps": 40000, "loss": 0.076, "lr": 0.21435682401411654, "epoch": 0.7013900764664207, "percentage": 35.89, "elapsed_time": "15:05:07", "remaining_time": "1 day, 2:57:00", "throughput": 334.96, "total_tokens": 18191232} {"current_steps": 14360, "total_steps": 40000, "loss": 0.06, "lr": 0.2143036112994385, "epoch": 0.7016343781301151, "percentage": 35.9, "elapsed_time": "15:05:10", "remaining_time": "1 day, 2:56:13", "throughput": 335.06, "total_tokens": 18197632} {"current_steps": 14365, "total_steps": 40000, "loss": 0.0426, "lr": 0.21425038866833548, "epoch": 0.7018786797938094, "percentage": 35.91, "elapsed_time": "15:05:14", "remaining_time": "1 day, 2:55:25", "throughput": 335.16, "total_tokens": 18203904} {"current_steps": 14370, "total_steps": 40000, "loss": 0.0632, "lr": 0.21419715612901508, "epoch": 0.7021229814575037, "percentage": 35.93, "elapsed_time": "15:05:17", "remaining_time": "1 day, 2:54:38", "throughput": 335.26, "total_tokens": 18210560} {"current_steps": 14375, "total_steps": 40000, "loss": 0.0706, "lr": 0.21414391368968652, "epoch": 0.702367283121198, "percentage": 35.94, "elapsed_time": "15:05:20", "remaining_time": "1 day, 2:53:51", "throughput": 335.36, "total_tokens": 18216960} {"current_steps": 14380, "total_steps": 40000, "loss": 0.0439, "lr": 0.21409066135856034, "epoch": 0.7026115847848924, "percentage": 35.95, "elapsed_time": "15:05:23", "remaining_time": "1 day, 2:53:04", "throughput": 335.46, "total_tokens": 18223296} {"current_steps": 14385, "total_steps": 40000, "loss": 0.0692, "lr": 0.21403739914384878, "epoch": 0.7028558864485868, "percentage": 35.96, "elapsed_time": "15:05:26", "remaining_time": "1 day, 2:52:17", "throughput": 335.56, "total_tokens": 18229600} {"current_steps": 14390, "total_steps": 40000, "loss": 0.0609, "lr": 0.21398412705376554, "epoch": 0.703100188112281, "percentage": 35.98, "elapsed_time": "15:05:29", "remaining_time": "1 day, 2:51:30", "throughput": 335.66, "total_tokens": 18236224} {"current_steps": 14395, "total_steps": 40000, "loss": 0.0458, "lr": 0.2139308450965258, "epoch": 0.7033444897759754, "percentage": 35.99, "elapsed_time": "15:05:32", "remaining_time": "1 day, 2:50:43", "throughput": 335.76, "total_tokens": 18242624} {"current_steps": 14400, "total_steps": 40000, "loss": 0.0684, "lr": 0.21387755328034638, "epoch": 0.7035887914396697, "percentage": 36.0, "elapsed_time": "15:05:35", "remaining_time": "1 day, 2:49:56", "throughput": 335.85, "total_tokens": 18248736} {"current_steps": 14400, "total_steps": 40000, "eval_loss": 0.06816627085208893, "epoch": 0.7035887914396697, "percentage": 36.0, "elapsed_time": "15:16:15", "remaining_time": "1 day, 3:08:55", "throughput": 331.94, "total_tokens": 18248736} {"current_steps": 14405, "total_steps": 40000, "loss": 0.0728, "lr": 0.2138242516134455, "epoch": 0.7038330931033641, "percentage": 36.01, "elapsed_time": "15:16:19", "remaining_time": "1 day, 3:08:08", "throughput": 332.03, "total_tokens": 18254880} {"current_steps": 14410, "total_steps": 40000, "loss": 0.0832, "lr": 0.2137709401040429, "epoch": 0.7040773947670583, "percentage": 36.02, "elapsed_time": "15:16:22", "remaining_time": "1 day, 3:07:20", "throughput": 332.12, "total_tokens": 18260960} {"current_steps": 14415, "total_steps": 40000, "loss": 0.0682, "lr": 0.21371761876036, "epoch": 0.7043216964307527, "percentage": 36.04, "elapsed_time": "15:16:25", "remaining_time": "1 day, 3:06:33", "throughput": 332.22, "total_tokens": 18267360} {"current_steps": 14420, "total_steps": 40000, "loss": 0.0711, "lr": 0.21366428759061956, "epoch": 0.704565998094447, "percentage": 36.05, "elapsed_time": "15:16:28", "remaining_time": "1 day, 3:05:46", "throughput": 332.32, "total_tokens": 18273696} {"current_steps": 14425, "total_steps": 40000, "loss": 0.0779, "lr": 0.2136109466030459, "epoch": 0.7048102997581414, "percentage": 36.06, "elapsed_time": "15:16:31", "remaining_time": "1 day, 3:04:58", "throughput": 332.41, "total_tokens": 18280160} {"current_steps": 14430, "total_steps": 40000, "loss": 0.0818, "lr": 0.2135575958058649, "epoch": 0.7050546014218357, "percentage": 36.08, "elapsed_time": "15:16:35", "remaining_time": "1 day, 3:04:11", "throughput": 332.51, "total_tokens": 18286432} {"current_steps": 14435, "total_steps": 40000, "loss": 0.0501, "lr": 0.2135042352073039, "epoch": 0.70529890308553, "percentage": 36.09, "elapsed_time": "15:16:38", "remaining_time": "1 day, 3:03:24", "throughput": 332.61, "total_tokens": 18293056} {"current_steps": 14440, "total_steps": 40000, "loss": 0.0643, "lr": 0.2134508648155918, "epoch": 0.7055432047492244, "percentage": 36.1, "elapsed_time": "15:16:41", "remaining_time": "1 day, 3:02:36", "throughput": 332.71, "total_tokens": 18299552} {"current_steps": 14445, "total_steps": 40000, "loss": 0.071, "lr": 0.213397484638959, "epoch": 0.7057875064129187, "percentage": 36.11, "elapsed_time": "15:16:44", "remaining_time": "1 day, 3:01:49", "throughput": 332.81, "total_tokens": 18305824} {"current_steps": 14450, "total_steps": 40000, "loss": 0.0694, "lr": 0.21334409468563728, "epoch": 0.706031808076613, "percentage": 36.12, "elapsed_time": "15:16:47", "remaining_time": "1 day, 3:01:02", "throughput": 332.9, "total_tokens": 18311904} {"current_steps": 14455, "total_steps": 40000, "loss": 0.0777, "lr": 0.2132906949638602, "epoch": 0.7062761097403073, "percentage": 36.14, "elapsed_time": "15:16:50", "remaining_time": "1 day, 3:00:14", "throughput": 332.99, "total_tokens": 18318112} {"current_steps": 14460, "total_steps": 40000, "loss": 0.0833, "lr": 0.21323728548186255, "epoch": 0.7065204114040017, "percentage": 36.15, "elapsed_time": "15:16:53", "remaining_time": "1 day, 2:59:27", "throughput": 333.1, "total_tokens": 18324960} {"current_steps": 14465, "total_steps": 40000, "loss": 0.0574, "lr": 0.21318386624788088, "epoch": 0.706764713067696, "percentage": 36.16, "elapsed_time": "15:16:56", "remaining_time": "1 day, 2:58:40", "throughput": 333.2, "total_tokens": 18331296} {"current_steps": 14470, "total_steps": 40000, "loss": 0.0511, "lr": 0.21313043727015288, "epoch": 0.7070090147313903, "percentage": 36.18, "elapsed_time": "15:16:59", "remaining_time": "1 day, 2:57:53", "throughput": 333.3, "total_tokens": 18338144} {"current_steps": 14475, "total_steps": 40000, "loss": 0.0643, "lr": 0.2130769985569182, "epoch": 0.7072533163950846, "percentage": 36.19, "elapsed_time": "15:17:02", "remaining_time": "1 day, 2:57:06", "throughput": 333.39, "total_tokens": 18344160} {"current_steps": 14480, "total_steps": 40000, "loss": 0.0678, "lr": 0.21302355011641766, "epoch": 0.707497618058779, "percentage": 36.2, "elapsed_time": "15:17:05", "remaining_time": "1 day, 2:56:19", "throughput": 333.5, "total_tokens": 18351136} {"current_steps": 14485, "total_steps": 40000, "loss": 0.062, "lr": 0.21297009195689365, "epoch": 0.7077419197224734, "percentage": 36.21, "elapsed_time": "15:17:09", "remaining_time": "1 day, 2:55:32", "throughput": 333.59, "total_tokens": 18357312} {"current_steps": 14490, "total_steps": 40000, "loss": 0.065, "lr": 0.21291662408659015, "epoch": 0.7079862213861676, "percentage": 36.23, "elapsed_time": "15:17:12", "remaining_time": "1 day, 2:54:45", "throughput": 333.69, "total_tokens": 18363648} {"current_steps": 14495, "total_steps": 40000, "loss": 0.0863, "lr": 0.21286314651375254, "epoch": 0.708230523049862, "percentage": 36.24, "elapsed_time": "15:17:15", "remaining_time": "1 day, 2:53:58", "throughput": 333.78, "total_tokens": 18369600} {"current_steps": 14500, "total_steps": 40000, "loss": 0.0862, "lr": 0.2128096592466278, "epoch": 0.7084748247135563, "percentage": 36.25, "elapsed_time": "15:17:18", "remaining_time": "1 day, 2:53:11", "throughput": 333.88, "total_tokens": 18376096} {"current_steps": 14505, "total_steps": 40000, "loss": 0.0842, "lr": 0.21275616229346428, "epoch": 0.7087191263772507, "percentage": 36.26, "elapsed_time": "15:17:21", "remaining_time": "1 day, 2:52:24", "throughput": 333.98, "total_tokens": 18382432} {"current_steps": 14510, "total_steps": 40000, "loss": 0.05, "lr": 0.21270265566251184, "epoch": 0.7089634280409449, "percentage": 36.27, "elapsed_time": "15:17:24", "remaining_time": "1 day, 2:51:37", "throughput": 334.07, "total_tokens": 18388736} {"current_steps": 14515, "total_steps": 40000, "loss": 0.0689, "lr": 0.21264913936202193, "epoch": 0.7092077297046393, "percentage": 36.29, "elapsed_time": "15:17:27", "remaining_time": "1 day, 2:50:50", "throughput": 334.16, "total_tokens": 18394912} {"current_steps": 14520, "total_steps": 40000, "loss": 0.056, "lr": 0.2125956134002475, "epoch": 0.7094520313683336, "percentage": 36.3, "elapsed_time": "15:17:30", "remaining_time": "1 day, 2:50:04", "throughput": 334.27, "total_tokens": 18401728} {"current_steps": 14525, "total_steps": 40000, "loss": 0.0813, "lr": 0.2125420777854428, "epoch": 0.709696333032028, "percentage": 36.31, "elapsed_time": "15:17:33", "remaining_time": "1 day, 2:49:17", "throughput": 334.37, "total_tokens": 18408128} {"current_steps": 14530, "total_steps": 40000, "loss": 0.0682, "lr": 0.21248853252586372, "epoch": 0.7099406346957223, "percentage": 36.33, "elapsed_time": "15:17:36", "remaining_time": "1 day, 2:48:30", "throughput": 334.46, "total_tokens": 18414528} {"current_steps": 14535, "total_steps": 40000, "loss": 0.057, "lr": 0.21243497762976774, "epoch": 0.7101849363594166, "percentage": 36.34, "elapsed_time": "15:17:39", "remaining_time": "1 day, 2:47:43", "throughput": 334.56, "total_tokens": 18420736} {"current_steps": 14540, "total_steps": 40000, "loss": 0.0585, "lr": 0.21238141310541356, "epoch": 0.710429238023111, "percentage": 36.35, "elapsed_time": "15:17:42", "remaining_time": "1 day, 2:46:57", "throughput": 334.66, "total_tokens": 18427264} {"current_steps": 14545, "total_steps": 40000, "loss": 0.0619, "lr": 0.21232783896106153, "epoch": 0.7106735396868052, "percentage": 36.36, "elapsed_time": "15:17:46", "remaining_time": "1 day, 2:46:10", "throughput": 334.75, "total_tokens": 18433504} {"current_steps": 14550, "total_steps": 40000, "loss": 0.0674, "lr": 0.21227425520497345, "epoch": 0.7109178413504996, "percentage": 36.38, "elapsed_time": "15:17:49", "remaining_time": "1 day, 2:45:23", "throughput": 334.85, "total_tokens": 18439872} {"current_steps": 14555, "total_steps": 40000, "loss": 0.0786, "lr": 0.2122206618454127, "epoch": 0.7111621430141939, "percentage": 36.39, "elapsed_time": "15:17:52", "remaining_time": "1 day, 2:44:37", "throughput": 334.94, "total_tokens": 18445920} {"current_steps": 14560, "total_steps": 40000, "loss": 0.0653, "lr": 0.2121670588906439, "epoch": 0.7114064446778883, "percentage": 36.4, "elapsed_time": "15:17:55", "remaining_time": "1 day, 2:43:50", "throughput": 335.04, "total_tokens": 18452544} {"current_steps": 14565, "total_steps": 40000, "loss": 0.0694, "lr": 0.21211344634893345, "epoch": 0.7116507463415825, "percentage": 36.41, "elapsed_time": "15:17:58", "remaining_time": "1 day, 2:43:04", "throughput": 335.15, "total_tokens": 18459296} {"current_steps": 14570, "total_steps": 40000, "loss": 0.0738, "lr": 0.21205982422854897, "epoch": 0.7118950480052769, "percentage": 36.43, "elapsed_time": "15:18:01", "remaining_time": "1 day, 2:42:17", "throughput": 335.24, "total_tokens": 18465600} {"current_steps": 14575, "total_steps": 40000, "loss": 0.11, "lr": 0.21200619253775974, "epoch": 0.7121393496689713, "percentage": 36.44, "elapsed_time": "15:18:04", "remaining_time": "1 day, 2:41:31", "throughput": 335.34, "total_tokens": 18472384} {"current_steps": 14580, "total_steps": 40000, "loss": 0.0565, "lr": 0.21195255128483637, "epoch": 0.7123836513326656, "percentage": 36.45, "elapsed_time": "15:18:07", "remaining_time": "1 day, 2:40:44", "throughput": 335.44, "total_tokens": 18478912} {"current_steps": 14585, "total_steps": 40000, "loss": 0.0652, "lr": 0.21189890047805102, "epoch": 0.71262795299636, "percentage": 36.46, "elapsed_time": "15:18:11", "remaining_time": "1 day, 2:39:58", "throughput": 335.54, "total_tokens": 18485152} {"current_steps": 14590, "total_steps": 40000, "loss": 0.0604, "lr": 0.21184524012567735, "epoch": 0.7128722546600542, "percentage": 36.48, "elapsed_time": "15:18:14", "remaining_time": "1 day, 2:39:12", "throughput": 335.63, "total_tokens": 18491232} {"current_steps": 14595, "total_steps": 40000, "loss": 0.0833, "lr": 0.2117915702359905, "epoch": 0.7131165563237486, "percentage": 36.49, "elapsed_time": "15:18:17", "remaining_time": "1 day, 2:38:25", "throughput": 335.73, "total_tokens": 18497728} {"current_steps": 14600, "total_steps": 40000, "loss": 0.05, "lr": 0.211737890817267, "epoch": 0.7133608579874429, "percentage": 36.5, "elapsed_time": "15:18:20", "remaining_time": "1 day, 2:37:39", "throughput": 335.84, "total_tokens": 18504672} {"current_steps": 14600, "total_steps": 40000, "eval_loss": 0.06778160482645035, "epoch": 0.7133608579874429, "percentage": 36.5, "elapsed_time": "15:29:00", "remaining_time": "1 day, 2:56:13", "throughput": 331.98, "total_tokens": 18504672} {"current_steps": 14605, "total_steps": 40000, "loss": 0.0841, "lr": 0.21168420187778483, "epoch": 0.7136051596511372, "percentage": 36.51, "elapsed_time": "15:29:04", "remaining_time": "1 day, 2:55:27", "throughput": 332.07, "total_tokens": 18510816} {"current_steps": 14610, "total_steps": 40000, "loss": 0.0545, "lr": 0.21163050342582362, "epoch": 0.7138494613148315, "percentage": 36.52, "elapsed_time": "15:29:07", "remaining_time": "1 day, 2:54:40", "throughput": 332.16, "total_tokens": 18517216} {"current_steps": 14615, "total_steps": 40000, "loss": 0.0688, "lr": 0.21157679546966426, "epoch": 0.7140937629785259, "percentage": 36.54, "elapsed_time": "15:29:10", "remaining_time": "1 day, 2:53:54", "throughput": 332.26, "total_tokens": 18523552} {"current_steps": 14620, "total_steps": 40000, "loss": 0.0747, "lr": 0.2115230780175892, "epoch": 0.7143380646422202, "percentage": 36.55, "elapsed_time": "15:29:13", "remaining_time": "1 day, 2:53:07", "throughput": 332.36, "total_tokens": 18530176} {"current_steps": 14625, "total_steps": 40000, "loss": 0.0843, "lr": 0.21146935107788237, "epoch": 0.7145823663059145, "percentage": 36.56, "elapsed_time": "15:29:16", "remaining_time": "1 day, 2:52:20", "throughput": 332.45, "total_tokens": 18536192} {"current_steps": 14630, "total_steps": 40000, "loss": 0.0618, "lr": 0.21141561465882916, "epoch": 0.7148266679696089, "percentage": 36.58, "elapsed_time": "15:29:19", "remaining_time": "1 day, 2:51:33", "throughput": 332.54, "total_tokens": 18542368} {"current_steps": 14635, "total_steps": 40000, "loss": 0.0981, "lr": 0.21136186876871635, "epoch": 0.7150709696333032, "percentage": 36.59, "elapsed_time": "15:29:22", "remaining_time": "1 day, 2:50:46", "throughput": 332.63, "total_tokens": 18548544} {"current_steps": 14640, "total_steps": 40000, "loss": 0.0629, "lr": 0.21130811341583225, "epoch": 0.7153152712969976, "percentage": 36.6, "elapsed_time": "15:29:26", "remaining_time": "1 day, 2:50:00", "throughput": 332.73, "total_tokens": 18554976} {"current_steps": 14645, "total_steps": 40000, "loss": 0.0699, "lr": 0.21125434860846667, "epoch": 0.7155595729606918, "percentage": 36.61, "elapsed_time": "15:29:29", "remaining_time": "1 day, 2:49:13", "throughput": 332.82, "total_tokens": 18561152} {"current_steps": 14650, "total_steps": 40000, "loss": 0.0726, "lr": 0.2112005743549107, "epoch": 0.7158038746243862, "percentage": 36.62, "elapsed_time": "15:29:32", "remaining_time": "1 day, 2:48:27", "throughput": 332.92, "total_tokens": 18567904} {"current_steps": 14655, "total_steps": 40000, "loss": 0.0937, "lr": 0.21114679066345707, "epoch": 0.7160481762880805, "percentage": 36.64, "elapsed_time": "15:29:35", "remaining_time": "1 day, 2:47:40", "throughput": 333.01, "total_tokens": 18574016} {"current_steps": 14660, "total_steps": 40000, "loss": 0.0784, "lr": 0.21109299754239993, "epoch": 0.7162924779517749, "percentage": 36.65, "elapsed_time": "15:29:38", "remaining_time": "1 day, 2:46:53", "throughput": 333.11, "total_tokens": 18580608} {"current_steps": 14665, "total_steps": 40000, "loss": 0.0631, "lr": 0.21103919500003482, "epoch": 0.7165367796154691, "percentage": 36.66, "elapsed_time": "15:29:41", "remaining_time": "1 day, 2:46:07", "throughput": 333.2, "total_tokens": 18586656} {"current_steps": 14670, "total_steps": 40000, "loss": 0.0758, "lr": 0.21098538304465872, "epoch": 0.7167810812791635, "percentage": 36.68, "elapsed_time": "15:29:44", "remaining_time": "1 day, 2:45:20", "throughput": 333.3, "total_tokens": 18593248} {"current_steps": 14675, "total_steps": 40000, "loss": 0.0596, "lr": 0.2109315616845702, "epoch": 0.7170253829428579, "percentage": 36.69, "elapsed_time": "15:29:47", "remaining_time": "1 day, 2:44:34", "throughput": 333.4, "total_tokens": 18599616} {"current_steps": 14680, "total_steps": 40000, "loss": 0.0502, "lr": 0.21087773092806925, "epoch": 0.7172696846065522, "percentage": 36.7, "elapsed_time": "15:29:50", "remaining_time": "1 day, 2:43:47", "throughput": 333.49, "total_tokens": 18605376} {"current_steps": 14685, "total_steps": 40000, "loss": 0.108, "lr": 0.21082389078345704, "epoch": 0.7175139862702465, "percentage": 36.71, "elapsed_time": "15:29:53", "remaining_time": "1 day, 2:43:01", "throughput": 333.59, "total_tokens": 18612064} {"current_steps": 14690, "total_steps": 40000, "loss": 0.101, "lr": 0.2107700412590365, "epoch": 0.7177582879339408, "percentage": 36.73, "elapsed_time": "15:29:56", "remaining_time": "1 day, 2:42:14", "throughput": 333.68, "total_tokens": 18618080} {"current_steps": 14695, "total_steps": 40000, "loss": 0.083, "lr": 0.210716182363112, "epoch": 0.7180025895976352, "percentage": 36.74, "elapsed_time": "15:29:59", "remaining_time": "1 day, 2:41:28", "throughput": 333.76, "total_tokens": 18624000} {"current_steps": 14700, "total_steps": 40000, "loss": 0.0581, "lr": 0.2106623141039891, "epoch": 0.7182468912613295, "percentage": 36.75, "elapsed_time": "15:30:02", "remaining_time": "1 day, 2:40:41", "throughput": 333.85, "total_tokens": 18630016} {"current_steps": 14705, "total_steps": 40000, "loss": 0.0802, "lr": 0.21060843648997507, "epoch": 0.7184911929250238, "percentage": 36.76, "elapsed_time": "15:30:05", "remaining_time": "1 day, 2:39:55", "throughput": 333.95, "total_tokens": 18636352} {"current_steps": 14710, "total_steps": 40000, "loss": 0.0757, "lr": 0.21055454952937844, "epoch": 0.7187354945887181, "percentage": 36.78, "elapsed_time": "15:30:08", "remaining_time": "1 day, 2:39:08", "throughput": 334.04, "total_tokens": 18642336} {"current_steps": 14715, "total_steps": 40000, "loss": 0.0992, "lr": 0.21050065323050937, "epoch": 0.7189797962524125, "percentage": 36.79, "elapsed_time": "15:30:11", "remaining_time": "1 day, 2:38:22", "throughput": 334.13, "total_tokens": 18648608} {"current_steps": 14720, "total_steps": 40000, "loss": 0.0788, "lr": 0.21044674760167928, "epoch": 0.7192240979161069, "percentage": 36.8, "elapsed_time": "15:30:15", "remaining_time": "1 day, 2:37:36", "throughput": 334.23, "total_tokens": 18655008} {"current_steps": 14725, "total_steps": 40000, "loss": 0.077, "lr": 0.210392832651201, "epoch": 0.7194683995798011, "percentage": 36.81, "elapsed_time": "15:30:18", "remaining_time": "1 day, 2:36:50", "throughput": 334.32, "total_tokens": 18660928} {"current_steps": 14730, "total_steps": 40000, "loss": 0.0941, "lr": 0.210338908387389, "epoch": 0.7197127012434955, "percentage": 36.83, "elapsed_time": "15:30:21", "remaining_time": "1 day, 2:36:03", "throughput": 334.41, "total_tokens": 18667328} {"current_steps": 14735, "total_steps": 40000, "loss": 0.0835, "lr": 0.21028497481855912, "epoch": 0.7199570029071898, "percentage": 36.84, "elapsed_time": "15:30:24", "remaining_time": "1 day, 2:35:17", "throughput": 334.5, "total_tokens": 18672960} {"current_steps": 14740, "total_steps": 40000, "loss": 0.074, "lr": 0.21023103195302847, "epoch": 0.7202013045708842, "percentage": 36.85, "elapsed_time": "15:30:27", "remaining_time": "1 day, 2:34:31", "throughput": 334.59, "total_tokens": 18679264} {"current_steps": 14745, "total_steps": 40000, "loss": 0.0747, "lr": 0.21017707979911582, "epoch": 0.7204456062345784, "percentage": 36.86, "elapsed_time": "15:30:30", "remaining_time": "1 day, 2:33:45", "throughput": 334.68, "total_tokens": 18685536} {"current_steps": 14750, "total_steps": 40000, "loss": 0.058, "lr": 0.21012311836514122, "epoch": 0.7206899078982728, "percentage": 36.88, "elapsed_time": "15:30:33", "remaining_time": "1 day, 2:32:58", "throughput": 334.77, "total_tokens": 18691552} {"current_steps": 14755, "total_steps": 40000, "loss": 0.1247, "lr": 0.21006914765942622, "epoch": 0.7209342095619671, "percentage": 36.89, "elapsed_time": "15:30:36", "remaining_time": "1 day, 2:32:13", "throughput": 334.87, "total_tokens": 18698048} {"current_steps": 14760, "total_steps": 40000, "loss": 0.0751, "lr": 0.2100151676902938, "epoch": 0.7211785112256615, "percentage": 36.9, "elapsed_time": "15:30:39", "remaining_time": "1 day, 2:31:26", "throughput": 334.96, "total_tokens": 18704032} {"current_steps": 14765, "total_steps": 40000, "loss": 0.0426, "lr": 0.2099611784660683, "epoch": 0.7214228128893557, "percentage": 36.91, "elapsed_time": "15:30:42", "remaining_time": "1 day, 2:30:41", "throughput": 335.06, "total_tokens": 18710752} {"current_steps": 14770, "total_steps": 40000, "loss": 0.1048, "lr": 0.20990717999507552, "epoch": 0.7216671145530501, "percentage": 36.93, "elapsed_time": "15:30:45", "remaining_time": "1 day, 2:29:54", "throughput": 335.15, "total_tokens": 18716608} {"current_steps": 14775, "total_steps": 40000, "loss": 0.0624, "lr": 0.20985317228564276, "epoch": 0.7219114162167445, "percentage": 36.94, "elapsed_time": "15:30:48", "remaining_time": "1 day, 2:29:08", "throughput": 335.24, "total_tokens": 18722752} {"current_steps": 14780, "total_steps": 40000, "loss": 0.0625, "lr": 0.20979915534609872, "epoch": 0.7221557178804388, "percentage": 36.95, "elapsed_time": "15:30:51", "remaining_time": "1 day, 2:28:22", "throughput": 335.33, "total_tokens": 18728800} {"current_steps": 14785, "total_steps": 40000, "loss": 0.0714, "lr": 0.20974512918477342, "epoch": 0.7224000195441331, "percentage": 36.96, "elapsed_time": "15:30:54", "remaining_time": "1 day, 2:27:37", "throughput": 335.43, "total_tokens": 18735072} {"current_steps": 14790, "total_steps": 40000, "loss": 0.0437, "lr": 0.2096910938099984, "epoch": 0.7226443212078274, "percentage": 36.98, "elapsed_time": "15:30:57", "remaining_time": "1 day, 2:26:51", "throughput": 335.52, "total_tokens": 18741600} {"current_steps": 14795, "total_steps": 40000, "loss": 0.084, "lr": 0.2096370492301066, "epoch": 0.7228886228715218, "percentage": 36.99, "elapsed_time": "15:31:00", "remaining_time": "1 day, 2:26:05", "throughput": 335.61, "total_tokens": 18747680} {"current_steps": 14800, "total_steps": 40000, "loss": 0.0822, "lr": 0.2095829954534323, "epoch": 0.723132924535216, "percentage": 37.0, "elapsed_time": "15:31:03", "remaining_time": "1 day, 2:25:19", "throughput": 335.71, "total_tokens": 18754208} {"current_steps": 14800, "total_steps": 40000, "eval_loss": 0.0717802569270134, "epoch": 0.723132924535216, "percentage": 37.0, "elapsed_time": "15:41:44", "remaining_time": "1 day, 2:43:30", "throughput": 331.91, "total_tokens": 18754208} {"current_steps": 14805, "total_steps": 40000, "loss": 0.0689, "lr": 0.2095289324883114, "epoch": 0.7233772261989104, "percentage": 37.01, "elapsed_time": "15:41:48", "remaining_time": "1 day, 2:42:44", "throughput": 331.99, "total_tokens": 18760192} {"current_steps": 14810, "total_steps": 40000, "loss": 0.0608, "lr": 0.20947486034308097, "epoch": 0.7236215278626047, "percentage": 37.03, "elapsed_time": "15:41:51", "remaining_time": "1 day, 2:41:58", "throughput": 332.09, "total_tokens": 18766976} {"current_steps": 14815, "total_steps": 40000, "loss": 0.0777, "lr": 0.2094207790260797, "epoch": 0.7238658295262991, "percentage": 37.04, "elapsed_time": "15:41:54", "remaining_time": "1 day, 2:41:12", "throughput": 332.18, "total_tokens": 18773152} {"current_steps": 14820, "total_steps": 40000, "loss": 0.0736, "lr": 0.20936668854564758, "epoch": 0.7241101311899935, "percentage": 37.05, "elapsed_time": "15:41:57", "remaining_time": "1 day, 2:40:26", "throughput": 332.27, "total_tokens": 18779264} {"current_steps": 14825, "total_steps": 40000, "loss": 0.0461, "lr": 0.20931258891012602, "epoch": 0.7243544328536877, "percentage": 37.06, "elapsed_time": "15:42:00", "remaining_time": "1 day, 2:39:40", "throughput": 332.37, "total_tokens": 18785952} {"current_steps": 14830, "total_steps": 40000, "loss": 0.0369, "lr": 0.20925848012785792, "epoch": 0.7245987345173821, "percentage": 37.08, "elapsed_time": "15:42:03", "remaining_time": "1 day, 2:38:54", "throughput": 332.48, "total_tokens": 18792768} {"current_steps": 14835, "total_steps": 40000, "loss": 0.089, "lr": 0.20920436220718747, "epoch": 0.7248430361810764, "percentage": 37.09, "elapsed_time": "15:42:06", "remaining_time": "1 day, 2:38:07", "throughput": 332.56, "total_tokens": 18798656} {"current_steps": 14840, "total_steps": 40000, "loss": 0.0627, "lr": 0.20915023515646033, "epoch": 0.7250873378447708, "percentage": 37.1, "elapsed_time": "15:42:09", "remaining_time": "1 day, 2:37:21", "throughput": 332.66, "total_tokens": 18805344} {"current_steps": 14845, "total_steps": 40000, "loss": 0.0508, "lr": 0.20909609898402368, "epoch": 0.725331639508465, "percentage": 37.11, "elapsed_time": "15:42:12", "remaining_time": "1 day, 2:36:35", "throughput": 332.75, "total_tokens": 18811456} {"current_steps": 14850, "total_steps": 40000, "loss": 0.0709, "lr": 0.2090419536982258, "epoch": 0.7255759411721594, "percentage": 37.12, "elapsed_time": "15:42:15", "remaining_time": "1 day, 2:35:49", "throughput": 332.84, "total_tokens": 18817216} {"current_steps": 14855, "total_steps": 40000, "loss": 0.0719, "lr": 0.2089877993074168, "epoch": 0.7258202428358537, "percentage": 37.14, "elapsed_time": "15:42:18", "remaining_time": "1 day, 2:35:03", "throughput": 332.93, "total_tokens": 18823360} {"current_steps": 14860, "total_steps": 40000, "loss": 0.0725, "lr": 0.20893363581994784, "epoch": 0.726064544499548, "percentage": 37.15, "elapsed_time": "15:42:22", "remaining_time": "1 day, 2:34:17", "throughput": 333.02, "total_tokens": 18829408} {"current_steps": 14865, "total_steps": 40000, "loss": 0.0604, "lr": 0.2088794632441716, "epoch": 0.7263088461632423, "percentage": 37.16, "elapsed_time": "15:42:25", "remaining_time": "1 day, 2:33:31", "throughput": 333.11, "total_tokens": 18835872} {"current_steps": 14870, "total_steps": 40000, "loss": 0.0628, "lr": 0.20882528158844219, "epoch": 0.7265531478269367, "percentage": 37.18, "elapsed_time": "15:42:28", "remaining_time": "1 day, 2:32:45", "throughput": 333.2, "total_tokens": 18842048} {"current_steps": 14875, "total_steps": 40000, "loss": 0.0495, "lr": 0.20877109086111514, "epoch": 0.7267974494906311, "percentage": 37.19, "elapsed_time": "15:42:31", "remaining_time": "1 day, 2:31:59", "throughput": 333.3, "total_tokens": 18848512} {"current_steps": 14880, "total_steps": 40000, "loss": 0.0579, "lr": 0.2087168910705473, "epoch": 0.7270417511543253, "percentage": 37.2, "elapsed_time": "15:42:34", "remaining_time": "1 day, 2:31:13", "throughput": 333.39, "total_tokens": 18854816} {"current_steps": 14885, "total_steps": 40000, "loss": 0.0756, "lr": 0.208662682225097, "epoch": 0.7272860528180197, "percentage": 37.21, "elapsed_time": "15:42:37", "remaining_time": "1 day, 2:30:28", "throughput": 333.49, "total_tokens": 18861376} {"current_steps": 14890, "total_steps": 40000, "loss": 0.0559, "lr": 0.2086084643331239, "epoch": 0.727530354481714, "percentage": 37.23, "elapsed_time": "15:42:40", "remaining_time": "1 day, 2:29:42", "throughput": 333.58, "total_tokens": 18867552} {"current_steps": 14895, "total_steps": 40000, "loss": 0.0979, "lr": 0.20855423740298906, "epoch": 0.7277746561454084, "percentage": 37.24, "elapsed_time": "15:42:43", "remaining_time": "1 day, 2:28:56", "throughput": 333.67, "total_tokens": 18873664} {"current_steps": 14900, "total_steps": 40000, "loss": 0.0652, "lr": 0.208500001443055, "epoch": 0.7280189578091026, "percentage": 37.25, "elapsed_time": "15:42:46", "remaining_time": "1 day, 2:28:10", "throughput": 333.77, "total_tokens": 18880224} {"current_steps": 14905, "total_steps": 40000, "loss": 0.0752, "lr": 0.20844575646168553, "epoch": 0.728263259472797, "percentage": 37.26, "elapsed_time": "15:42:49", "remaining_time": "1 day, 2:27:24", "throughput": 333.85, "total_tokens": 18885952} {"current_steps": 14910, "total_steps": 40000, "loss": 0.0785, "lr": 0.20839150246724594, "epoch": 0.7285075611364913, "percentage": 37.28, "elapsed_time": "15:42:52", "remaining_time": "1 day, 2:26:38", "throughput": 333.94, "total_tokens": 18891968} {"current_steps": 14915, "total_steps": 40000, "loss": 0.0555, "lr": 0.20833723946810287, "epoch": 0.7287518628001857, "percentage": 37.29, "elapsed_time": "15:42:56", "remaining_time": "1 day, 2:25:53", "throughput": 334.04, "total_tokens": 18898624} {"current_steps": 14920, "total_steps": 40000, "loss": 0.041, "lr": 0.20828296747262437, "epoch": 0.72899616446388, "percentage": 37.3, "elapsed_time": "15:42:59", "remaining_time": "1 day, 2:25:07", "throughput": 334.14, "total_tokens": 18905088} {"current_steps": 14925, "total_steps": 40000, "loss": 0.098, "lr": 0.20822868648917986, "epoch": 0.7292404661275743, "percentage": 37.31, "elapsed_time": "15:43:02", "remaining_time": "1 day, 2:24:21", "throughput": 334.23, "total_tokens": 18911296} {"current_steps": 14930, "total_steps": 40000, "loss": 0.053, "lr": 0.20817439652614017, "epoch": 0.7294847677912687, "percentage": 37.33, "elapsed_time": "15:43:05", "remaining_time": "1 day, 2:23:36", "throughput": 334.31, "total_tokens": 18917152} {"current_steps": 14935, "total_steps": 40000, "loss": 0.054, "lr": 0.20812009759187744, "epoch": 0.729729069454963, "percentage": 37.34, "elapsed_time": "15:43:08", "remaining_time": "1 day, 2:22:50", "throughput": 334.4, "total_tokens": 18922944} {"current_steps": 14940, "total_steps": 40000, "loss": 0.0612, "lr": 0.2080657896947653, "epoch": 0.7299733711186573, "percentage": 37.35, "elapsed_time": "15:43:11", "remaining_time": "1 day, 2:22:05", "throughput": 334.5, "total_tokens": 18929696} {"current_steps": 14945, "total_steps": 40000, "loss": 0.0579, "lr": 0.2080114728431787, "epoch": 0.7302176727823516, "percentage": 37.36, "elapsed_time": "15:43:14", "remaining_time": "1 day, 2:21:19", "throughput": 334.59, "total_tokens": 18935872} {"current_steps": 14950, "total_steps": 40000, "loss": 0.0542, "lr": 0.20795714704549392, "epoch": 0.730461974446046, "percentage": 37.38, "elapsed_time": "15:43:17", "remaining_time": "1 day, 2:20:33", "throughput": 334.68, "total_tokens": 18941920} {"current_steps": 14955, "total_steps": 40000, "loss": 0.0636, "lr": 0.20790281231008875, "epoch": 0.7307062761097403, "percentage": 37.39, "elapsed_time": "15:43:20", "remaining_time": "1 day, 2:19:48", "throughput": 334.77, "total_tokens": 18948192} {"current_steps": 14960, "total_steps": 40000, "loss": 0.051, "lr": 0.20784846864534226, "epoch": 0.7309505777734346, "percentage": 37.4, "elapsed_time": "15:43:23", "remaining_time": "1 day, 2:19:03", "throughput": 334.87, "total_tokens": 18954624} {"current_steps": 14965, "total_steps": 40000, "loss": 0.069, "lr": 0.20779411605963496, "epoch": 0.731194879437129, "percentage": 37.41, "elapsed_time": "15:43:26", "remaining_time": "1 day, 2:18:17", "throughput": 334.96, "total_tokens": 18961056} {"current_steps": 14970, "total_steps": 40000, "loss": 0.1014, "lr": 0.2077397545613487, "epoch": 0.7314391811008233, "percentage": 37.43, "elapsed_time": "15:43:29", "remaining_time": "1 day, 2:17:32", "throughput": 335.05, "total_tokens": 18967392} {"current_steps": 14975, "total_steps": 40000, "loss": 0.0665, "lr": 0.20768538415886661, "epoch": 0.7316834827645177, "percentage": 37.44, "elapsed_time": "15:43:32", "remaining_time": "1 day, 2:16:46", "throughput": 335.15, "total_tokens": 18973568} {"current_steps": 14980, "total_steps": 40000, "loss": 0.0315, "lr": 0.20763100486057343, "epoch": 0.7319277844282119, "percentage": 37.45, "elapsed_time": "15:43:35", "remaining_time": "1 day, 2:16:01", "throughput": 335.24, "total_tokens": 18979872} {"current_steps": 14985, "total_steps": 40000, "loss": 0.0631, "lr": 0.20757661667485502, "epoch": 0.7321720860919063, "percentage": 37.46, "elapsed_time": "15:43:39", "remaining_time": "1 day, 2:15:16", "throughput": 335.34, "total_tokens": 18986752} {"current_steps": 14990, "total_steps": 40000, "loss": 0.1075, "lr": 0.2075222196100988, "epoch": 0.7324163877556006, "percentage": 37.48, "elapsed_time": "15:43:42", "remaining_time": "1 day, 2:14:30", "throughput": 335.43, "total_tokens": 18992800} {"current_steps": 14995, "total_steps": 40000, "loss": 0.08, "lr": 0.20746781367469344, "epoch": 0.732660689419295, "percentage": 37.49, "elapsed_time": "15:43:45", "remaining_time": "1 day, 2:13:45", "throughput": 335.54, "total_tokens": 18999840} {"current_steps": 15000, "total_steps": 40000, "loss": 0.0777, "lr": 0.207413398877029, "epoch": 0.7329049910829892, "percentage": 37.5, "elapsed_time": "15:43:48", "remaining_time": "1 day, 2:13:00", "throughput": 335.62, "total_tokens": 19005696} {"current_steps": 15000, "total_steps": 40000, "eval_loss": 0.06825573742389679, "epoch": 0.7329049910829892, "percentage": 37.5, "elapsed_time": "15:54:28", "remaining_time": "1 day, 2:30:47", "throughput": 331.87, "total_tokens": 19005696} {"current_steps": 15005, "total_steps": 40000, "loss": 0.0513, "lr": 0.20735897522549698, "epoch": 0.7331492927466836, "percentage": 37.51, "elapsed_time": "15:54:32", "remaining_time": "1 day, 2:30:02", "throughput": 331.96, "total_tokens": 19012224} {"current_steps": 15010, "total_steps": 40000, "loss": 0.0585, "lr": 0.2073045427284902, "epoch": 0.7333935944103779, "percentage": 37.52, "elapsed_time": "15:54:35", "remaining_time": "1 day, 2:29:17", "throughput": 332.07, "total_tokens": 19019264} {"current_steps": 15015, "total_steps": 40000, "loss": 0.0818, "lr": 0.2072501013944027, "epoch": 0.7336378960740723, "percentage": 37.54, "elapsed_time": "15:54:38", "remaining_time": "1 day, 2:28:31", "throughput": 332.16, "total_tokens": 19025568} {"current_steps": 15020, "total_steps": 40000, "loss": 0.0673, "lr": 0.20719565123163017, "epoch": 0.7338821977377666, "percentage": 37.55, "elapsed_time": "15:54:41", "remaining_time": "1 day, 2:27:45", "throughput": 332.25, "total_tokens": 19031776} {"current_steps": 15025, "total_steps": 40000, "loss": 0.0704, "lr": 0.20714119224856944, "epoch": 0.7341264994014609, "percentage": 37.56, "elapsed_time": "15:54:44", "remaining_time": "1 day, 2:27:00", "throughput": 332.34, "total_tokens": 19038048} {"current_steps": 15030, "total_steps": 40000, "loss": 0.0619, "lr": 0.2070867244536188, "epoch": 0.7343708010651553, "percentage": 37.57, "elapsed_time": "15:54:47", "remaining_time": "1 day, 2:26:14", "throughput": 332.43, "total_tokens": 19044256} {"current_steps": 15035, "total_steps": 40000, "loss": 0.0552, "lr": 0.20703224785517785, "epoch": 0.7346151027288496, "percentage": 37.59, "elapsed_time": "15:54:50", "remaining_time": "1 day, 2:25:29", "throughput": 332.52, "total_tokens": 19050560} {"current_steps": 15040, "total_steps": 40000, "loss": 0.096, "lr": 0.20697776246164754, "epoch": 0.7348594043925439, "percentage": 37.6, "elapsed_time": "15:54:53", "remaining_time": "1 day, 2:24:43", "throughput": 332.61, "total_tokens": 19056768} {"current_steps": 15045, "total_steps": 40000, "loss": 0.0687, "lr": 0.2069232682814303, "epoch": 0.7351037060562382, "percentage": 37.61, "elapsed_time": "15:54:57", "remaining_time": "1 day, 2:23:58", "throughput": 332.71, "total_tokens": 19063328} {"current_steps": 15050, "total_steps": 40000, "loss": 0.0549, "lr": 0.20686876532292972, "epoch": 0.7353480077199326, "percentage": 37.62, "elapsed_time": "15:55:00", "remaining_time": "1 day, 2:23:12", "throughput": 332.81, "total_tokens": 19070144} {"current_steps": 15055, "total_steps": 40000, "loss": 0.0864, "lr": 0.20681425359455083, "epoch": 0.7355923093836269, "percentage": 37.64, "elapsed_time": "15:55:03", "remaining_time": "1 day, 2:22:27", "throughput": 332.9, "total_tokens": 19076544} {"current_steps": 15060, "total_steps": 40000, "loss": 0.0666, "lr": 0.20675973310470008, "epoch": 0.7358366110473212, "percentage": 37.65, "elapsed_time": "15:55:06", "remaining_time": "1 day, 2:21:41", "throughput": 333.0, "total_tokens": 19083040} {"current_steps": 15065, "total_steps": 40000, "loss": 0.0574, "lr": 0.2067052038617852, "epoch": 0.7360809127110156, "percentage": 37.66, "elapsed_time": "15:55:09", "remaining_time": "1 day, 2:20:56", "throughput": 333.09, "total_tokens": 19089024} {"current_steps": 15070, "total_steps": 40000, "loss": 0.0467, "lr": 0.2066506658742153, "epoch": 0.7363252143747099, "percentage": 37.67, "elapsed_time": "15:55:12", "remaining_time": "1 day, 2:20:11", "throughput": 333.19, "total_tokens": 19095744} {"current_steps": 15075, "total_steps": 40000, "loss": 0.0574, "lr": 0.20659611915040077, "epoch": 0.7365695160384043, "percentage": 37.69, "elapsed_time": "15:55:15", "remaining_time": "1 day, 2:19:25", "throughput": 333.27, "total_tokens": 19101728} {"current_steps": 15080, "total_steps": 40000, "loss": 0.0632, "lr": 0.20654156369875348, "epoch": 0.7368138177020985, "percentage": 37.7, "elapsed_time": "15:55:18", "remaining_time": "1 day, 2:18:40", "throughput": 333.36, "total_tokens": 19107712} {"current_steps": 15085, "total_steps": 40000, "loss": 0.0434, "lr": 0.20648699952768648, "epoch": 0.7370581193657929, "percentage": 37.71, "elapsed_time": "15:55:21", "remaining_time": "1 day, 2:17:55", "throughput": 333.45, "total_tokens": 19113952} {"current_steps": 15090, "total_steps": 40000, "loss": 0.0803, "lr": 0.20643242664561437, "epoch": 0.7373024210294872, "percentage": 37.72, "elapsed_time": "15:55:25", "remaining_time": "1 day, 2:17:10", "throughput": 333.55, "total_tokens": 19120832} {"current_steps": 15095, "total_steps": 40000, "loss": 0.0789, "lr": 0.20637784506095277, "epoch": 0.7375467226931816, "percentage": 37.74, "elapsed_time": "15:55:28", "remaining_time": "1 day, 2:16:24", "throughput": 333.64, "total_tokens": 19127040} {"current_steps": 15100, "total_steps": 40000, "loss": 0.0538, "lr": 0.20632325478211908, "epoch": 0.7377910243568758, "percentage": 37.75, "elapsed_time": "15:55:31", "remaining_time": "1 day, 2:15:39", "throughput": 333.74, "total_tokens": 19133600} {"current_steps": 15105, "total_steps": 40000, "loss": 0.064, "lr": 0.20626865581753165, "epoch": 0.7380353260205702, "percentage": 37.76, "elapsed_time": "15:55:34", "remaining_time": "1 day, 2:14:54", "throughput": 333.83, "total_tokens": 19140000} {"current_steps": 15110, "total_steps": 40000, "loss": 0.0664, "lr": 0.2062140481756104, "epoch": 0.7382796276842646, "percentage": 37.77, "elapsed_time": "15:55:37", "remaining_time": "1 day, 2:14:09", "throughput": 333.92, "total_tokens": 19146048} {"current_steps": 15115, "total_steps": 40000, "loss": 0.0504, "lr": 0.20615943186477648, "epoch": 0.7385239293479589, "percentage": 37.79, "elapsed_time": "15:55:40", "remaining_time": "1 day, 2:13:24", "throughput": 334.01, "total_tokens": 19152224} {"current_steps": 15120, "total_steps": 40000, "loss": 0.049, "lr": 0.20610480689345242, "epoch": 0.7387682310116532, "percentage": 37.8, "elapsed_time": "15:55:43", "remaining_time": "1 day, 2:12:38", "throughput": 334.1, "total_tokens": 19158400} {"current_steps": 15125, "total_steps": 40000, "loss": 0.079, "lr": 0.2060501732700621, "epoch": 0.7390125326753475, "percentage": 37.81, "elapsed_time": "15:55:46", "remaining_time": "1 day, 2:11:53", "throughput": 334.19, "total_tokens": 19164672} {"current_steps": 15130, "total_steps": 40000, "loss": 0.0353, "lr": 0.20599553100303067, "epoch": 0.7392568343390419, "percentage": 37.82, "elapsed_time": "15:55:49", "remaining_time": "1 day, 2:11:08", "throughput": 334.29, "total_tokens": 19171360} {"current_steps": 15135, "total_steps": 40000, "loss": 0.0321, "lr": 0.20594088010078465, "epoch": 0.7395011360027361, "percentage": 37.84, "elapsed_time": "15:55:52", "remaining_time": "1 day, 2:10:23", "throughput": 334.38, "total_tokens": 19177664} {"current_steps": 15140, "total_steps": 40000, "loss": 0.0704, "lr": 0.20588622057175196, "epoch": 0.7397454376664305, "percentage": 37.85, "elapsed_time": "15:55:56", "remaining_time": "1 day, 2:09:39", "throughput": 334.49, "total_tokens": 19184896} {"current_steps": 15145, "total_steps": 40000, "loss": 0.0568, "lr": 0.20583155242436177, "epoch": 0.7399897393301248, "percentage": 37.86, "elapsed_time": "15:55:59", "remaining_time": "1 day, 2:08:54", "throughput": 334.57, "total_tokens": 19190912} {"current_steps": 15150, "total_steps": 40000, "loss": 0.0971, "lr": 0.20577687566704453, "epoch": 0.7402340409938192, "percentage": 37.88, "elapsed_time": "15:56:02", "remaining_time": "1 day, 2:08:09", "throughput": 334.67, "total_tokens": 19197312} {"current_steps": 15155, "total_steps": 40000, "loss": 0.0544, "lr": 0.20572219030823213, "epoch": 0.7404783426575134, "percentage": 37.89, "elapsed_time": "15:56:05", "remaining_time": "1 day, 2:07:24", "throughput": 334.77, "total_tokens": 19204160} {"current_steps": 15160, "total_steps": 40000, "loss": 0.0517, "lr": 0.20566749635635775, "epoch": 0.7407226443212078, "percentage": 37.9, "elapsed_time": "15:56:08", "remaining_time": "1 day, 2:06:39", "throughput": 334.86, "total_tokens": 19210144} {"current_steps": 15165, "total_steps": 40000, "loss": 0.0995, "lr": 0.20561279381985587, "epoch": 0.7409669459849022, "percentage": 37.91, "elapsed_time": "15:56:11", "remaining_time": "1 day, 2:05:54", "throughput": 334.95, "total_tokens": 19216384} {"current_steps": 15170, "total_steps": 40000, "loss": 0.0524, "lr": 0.2055580827071623, "epoch": 0.7412112476485965, "percentage": 37.92, "elapsed_time": "15:56:14", "remaining_time": "1 day, 2:05:09", "throughput": 335.03, "total_tokens": 19222432} {"current_steps": 15175, "total_steps": 40000, "loss": 0.0879, "lr": 0.20550336302671418, "epoch": 0.7414555493122909, "percentage": 37.94, "elapsed_time": "15:56:17", "remaining_time": "1 day, 2:04:24", "throughput": 335.12, "total_tokens": 19228512} {"current_steps": 15180, "total_steps": 40000, "loss": 0.0877, "lr": 0.20544863478695, "epoch": 0.7416998509759851, "percentage": 37.95, "elapsed_time": "15:56:20", "remaining_time": "1 day, 2:03:40", "throughput": 335.22, "total_tokens": 19235136} {"current_steps": 15185, "total_steps": 40000, "loss": 0.0685, "lr": 0.20539389799630953, "epoch": 0.7419441526396795, "percentage": 37.96, "elapsed_time": "15:56:23", "remaining_time": "1 day, 2:02:55", "throughput": 335.32, "total_tokens": 19241760} {"current_steps": 15190, "total_steps": 40000, "loss": 0.044, "lr": 0.20533915266323388, "epoch": 0.7421884543033738, "percentage": 37.97, "elapsed_time": "15:56:27", "remaining_time": "1 day, 2:02:10", "throughput": 335.41, "total_tokens": 19248128} {"current_steps": 15195, "total_steps": 40000, "loss": 0.0477, "lr": 0.20528439879616542, "epoch": 0.7424327559670681, "percentage": 37.99, "elapsed_time": "15:56:30", "remaining_time": "1 day, 2:01:26", "throughput": 335.5, "total_tokens": 19254240} {"current_steps": 15200, "total_steps": 40000, "loss": 0.0631, "lr": 0.20522963640354794, "epoch": 0.7426770576307624, "percentage": 38.0, "elapsed_time": "15:56:33", "remaining_time": "1 day, 2:00:41", "throughput": 335.59, "total_tokens": 19260320} {"current_steps": 15200, "total_steps": 40000, "eval_loss": 0.0679754987359047, "epoch": 0.7426770576307624, "percentage": 38.0, "elapsed_time": "16:07:13", "remaining_time": "1 day, 2:18:05", "throughput": 331.88, "total_tokens": 19260320} {"current_steps": 15205, "total_steps": 40000, "loss": 0.1135, "lr": 0.20517486549382644, "epoch": 0.7429213592944568, "percentage": 38.01, "elapsed_time": "16:07:16", "remaining_time": "1 day, 2:17:21", "throughput": 331.97, "total_tokens": 19266816} {"current_steps": 15210, "total_steps": 40000, "loss": 0.0924, "lr": 0.20512008607544735, "epoch": 0.7431656609581512, "percentage": 38.02, "elapsed_time": "16:07:19", "remaining_time": "1 day, 2:16:36", "throughput": 332.06, "total_tokens": 19272768} {"current_steps": 15215, "total_steps": 40000, "loss": 0.0456, "lr": 0.20506529815685826, "epoch": 0.7434099626218454, "percentage": 38.04, "elapsed_time": "16:07:23", "remaining_time": "1 day, 2:15:51", "throughput": 332.15, "total_tokens": 19279168} {"current_steps": 15220, "total_steps": 40000, "loss": 0.0481, "lr": 0.2050105017465082, "epoch": 0.7436542642855398, "percentage": 38.05, "elapsed_time": "16:07:26", "remaining_time": "1 day, 2:15:06", "throughput": 332.25, "total_tokens": 19285632} {"current_steps": 15225, "total_steps": 40000, "loss": 0.0874, "lr": 0.20495569685284754, "epoch": 0.7438985659492341, "percentage": 38.06, "elapsed_time": "16:07:29", "remaining_time": "1 day, 2:14:21", "throughput": 332.34, "total_tokens": 19291968} {"current_steps": 15230, "total_steps": 40000, "loss": 0.0397, "lr": 0.20490088348432778, "epoch": 0.7441428676129285, "percentage": 38.07, "elapsed_time": "16:07:32", "remaining_time": "1 day, 2:13:36", "throughput": 332.43, "total_tokens": 19298464} {"current_steps": 15235, "total_steps": 40000, "loss": 0.0722, "lr": 0.2048460616494018, "epoch": 0.7443871692766227, "percentage": 38.09, "elapsed_time": "16:07:35", "remaining_time": "1 day, 2:12:50", "throughput": 332.52, "total_tokens": 19304416} {"current_steps": 15240, "total_steps": 40000, "loss": 0.0474, "lr": 0.2047912313565239, "epoch": 0.7446314709403171, "percentage": 38.1, "elapsed_time": "16:07:38", "remaining_time": "1 day, 2:12:05", "throughput": 332.6, "total_tokens": 19310304} {"current_steps": 15245, "total_steps": 40000, "loss": 0.0717, "lr": 0.20473639261414958, "epoch": 0.7448757726040114, "percentage": 38.11, "elapsed_time": "16:07:41", "remaining_time": "1 day, 2:11:21", "throughput": 332.7, "total_tokens": 19317344} {"current_steps": 15250, "total_steps": 40000, "loss": 0.0722, "lr": 0.2046815454307357, "epoch": 0.7451200742677058, "percentage": 38.12, "elapsed_time": "16:07:44", "remaining_time": "1 day, 2:10:36", "throughput": 332.8, "total_tokens": 19323904} {"current_steps": 15255, "total_steps": 40000, "loss": 0.0917, "lr": 0.20462668981474028, "epoch": 0.7453643759314001, "percentage": 38.14, "elapsed_time": "16:07:47", "remaining_time": "1 day, 2:09:51", "throughput": 332.89, "total_tokens": 19329920} {"current_steps": 15260, "total_steps": 40000, "loss": 0.0749, "lr": 0.20457182577462288, "epoch": 0.7456086775950944, "percentage": 38.15, "elapsed_time": "16:07:51", "remaining_time": "1 day, 2:09:06", "throughput": 332.98, "total_tokens": 19336544} {"current_steps": 15265, "total_steps": 40000, "loss": 0.0635, "lr": 0.2045169533188441, "epoch": 0.7458529792587888, "percentage": 38.16, "elapsed_time": "16:07:54", "remaining_time": "1 day, 2:08:21", "throughput": 333.07, "total_tokens": 19342880} {"current_steps": 15270, "total_steps": 40000, "loss": 0.0644, "lr": 0.20446207245586603, "epoch": 0.7460972809224831, "percentage": 38.17, "elapsed_time": "16:07:57", "remaining_time": "1 day, 2:07:36", "throughput": 333.16, "total_tokens": 19348800} {"current_steps": 15275, "total_steps": 40000, "loss": 0.0629, "lr": 0.20440718319415196, "epoch": 0.7463415825861774, "percentage": 38.19, "elapsed_time": "16:08:00", "remaining_time": "1 day, 2:06:51", "throughput": 333.24, "total_tokens": 19354784} {"current_steps": 15280, "total_steps": 40000, "loss": 0.0669, "lr": 0.20435228554216653, "epoch": 0.7465858842498717, "percentage": 38.2, "elapsed_time": "16:08:03", "remaining_time": "1 day, 2:06:07", "throughput": 333.34, "total_tokens": 19361408} {"current_steps": 15285, "total_steps": 40000, "loss": 0.0483, "lr": 0.20429737950837565, "epoch": 0.7468301859135661, "percentage": 38.21, "elapsed_time": "16:08:06", "remaining_time": "1 day, 2:05:22", "throughput": 333.44, "total_tokens": 19368192} {"current_steps": 15290, "total_steps": 40000, "loss": 0.0663, "lr": 0.20424246510124647, "epoch": 0.7470744875772604, "percentage": 38.22, "elapsed_time": "16:08:09", "remaining_time": "1 day, 2:04:38", "throughput": 333.54, "total_tokens": 19374976} {"current_steps": 15295, "total_steps": 40000, "loss": 0.0311, "lr": 0.20418754232924755, "epoch": 0.7473187892409547, "percentage": 38.24, "elapsed_time": "16:08:12", "remaining_time": "1 day, 2:03:53", "throughput": 333.63, "total_tokens": 19381792} {"current_steps": 15300, "total_steps": 40000, "loss": 0.0619, "lr": 0.20413261120084863, "epoch": 0.747563090904649, "percentage": 38.25, "elapsed_time": "16:08:15", "remaining_time": "1 day, 2:03:08", "throughput": 333.73, "total_tokens": 19388384} {"current_steps": 15305, "total_steps": 40000, "loss": 0.0381, "lr": 0.2040776717245208, "epoch": 0.7478073925683434, "percentage": 38.26, "elapsed_time": "16:08:18", "remaining_time": "1 day, 2:02:24", "throughput": 333.81, "total_tokens": 19394240} {"current_steps": 15310, "total_steps": 40000, "loss": 0.0457, "lr": 0.2040227239087364, "epoch": 0.7480516942320378, "percentage": 38.27, "elapsed_time": "16:08:22", "remaining_time": "1 day, 2:01:39", "throughput": 333.91, "total_tokens": 19400704} {"current_steps": 15315, "total_steps": 40000, "loss": 0.0791, "lr": 0.20396776776196904, "epoch": 0.748295995895732, "percentage": 38.29, "elapsed_time": "16:08:25", "remaining_time": "1 day, 2:00:54", "throughput": 333.99, "total_tokens": 19406752} {"current_steps": 15320, "total_steps": 40000, "loss": 0.058, "lr": 0.20391280329269373, "epoch": 0.7485402975594264, "percentage": 38.3, "elapsed_time": "16:08:28", "remaining_time": "1 day, 2:00:10", "throughput": 334.08, "total_tokens": 19412928} {"current_steps": 15325, "total_steps": 40000, "loss": 0.0708, "lr": 0.20385783050938663, "epoch": 0.7487845992231207, "percentage": 38.31, "elapsed_time": "16:08:31", "remaining_time": "1 day, 1:59:25", "throughput": 334.18, "total_tokens": 19419552} {"current_steps": 15330, "total_steps": 40000, "loss": 0.0681, "lr": 0.20380284942052526, "epoch": 0.7490289008868151, "percentage": 38.32, "elapsed_time": "16:08:34", "remaining_time": "1 day, 1:58:41", "throughput": 334.26, "total_tokens": 19425408} {"current_steps": 15335, "total_steps": 40000, "loss": 0.0578, "lr": 0.2037478600345884, "epoch": 0.7492732025505093, "percentage": 38.34, "elapsed_time": "16:08:37", "remaining_time": "1 day, 1:57:56", "throughput": 334.35, "total_tokens": 19431552} {"current_steps": 15340, "total_steps": 40000, "loss": 0.0545, "lr": 0.20369286236005604, "epoch": 0.7495175042142037, "percentage": 38.35, "elapsed_time": "16:08:40", "remaining_time": "1 day, 1:57:12", "throughput": 334.44, "total_tokens": 19437760} {"current_steps": 15345, "total_steps": 40000, "loss": 0.0875, "lr": 0.20363785640540957, "epoch": 0.749761805877898, "percentage": 38.36, "elapsed_time": "16:08:43", "remaining_time": "1 day, 1:56:27", "throughput": 334.52, "total_tokens": 19443200} {"current_steps": 15350, "total_steps": 40000, "loss": 0.0781, "lr": 0.2035828421791316, "epoch": 0.7500061075415924, "percentage": 38.38, "elapsed_time": "16:08:46", "remaining_time": "1 day, 1:55:43", "throughput": 334.61, "total_tokens": 19449792} {"current_steps": 15355, "total_steps": 40000, "loss": 0.0765, "lr": 0.20352781968970599, "epoch": 0.7502504092052867, "percentage": 38.39, "elapsed_time": "16:08:49", "remaining_time": "1 day, 1:54:59", "throughput": 334.71, "total_tokens": 19456512} {"current_steps": 15360, "total_steps": 40000, "loss": 0.0993, "lr": 0.2034727889456179, "epoch": 0.750494710868981, "percentage": 38.4, "elapsed_time": "16:08:52", "remaining_time": "1 day, 1:54:14", "throughput": 334.8, "total_tokens": 19462912} {"current_steps": 15365, "total_steps": 40000, "loss": 0.0675, "lr": 0.2034177499553538, "epoch": 0.7507390125326754, "percentage": 38.41, "elapsed_time": "16:08:55", "remaining_time": "1 day, 1:53:30", "throughput": 334.89, "total_tokens": 19469024} {"current_steps": 15370, "total_steps": 40000, "loss": 0.0641, "lr": 0.2033627027274014, "epoch": 0.7509833141963697, "percentage": 38.42, "elapsed_time": "16:08:58", "remaining_time": "1 day, 1:52:45", "throughput": 334.98, "total_tokens": 19475424} {"current_steps": 15375, "total_steps": 40000, "loss": 0.0483, "lr": 0.20330764727024955, "epoch": 0.751227615860064, "percentage": 38.44, "elapsed_time": "16:09:01", "remaining_time": "1 day, 1:52:01", "throughput": 335.07, "total_tokens": 19481760} {"current_steps": 15380, "total_steps": 40000, "loss": 0.088, "lr": 0.20325258359238868, "epoch": 0.7514719175237583, "percentage": 38.45, "elapsed_time": "16:09:05", "remaining_time": "1 day, 1:51:17", "throughput": 335.16, "total_tokens": 19488032} {"current_steps": 15385, "total_steps": 40000, "loss": 0.0549, "lr": 0.20319751170231018, "epoch": 0.7517162191874527, "percentage": 38.46, "elapsed_time": "16:09:08", "remaining_time": "1 day, 1:50:33", "throughput": 335.27, "total_tokens": 19495584} {"current_steps": 15390, "total_steps": 40000, "loss": 0.0777, "lr": 0.2031424316085068, "epoch": 0.751960520851147, "percentage": 38.48, "elapsed_time": "16:09:11", "remaining_time": "1 day, 1:49:49", "throughput": 335.37, "total_tokens": 19502272} {"current_steps": 15395, "total_steps": 40000, "loss": 0.0714, "lr": 0.20308734331947265, "epoch": 0.7522048225148413, "percentage": 38.49, "elapsed_time": "16:09:14", "remaining_time": "1 day, 1:49:05", "throughput": 335.46, "total_tokens": 19508736} {"current_steps": 15400, "total_steps": 40000, "loss": 0.07, "lr": 0.20303224684370305, "epoch": 0.7524491241785357, "percentage": 38.5, "elapsed_time": "16:09:17", "remaining_time": "1 day, 1:48:21", "throughput": 335.55, "total_tokens": 19514944} {"current_steps": 15400, "total_steps": 40000, "eval_loss": 0.06788071244955063, "epoch": 0.7524491241785357, "percentage": 38.5, "elapsed_time": "16:19:57", "remaining_time": "1 day, 2:05:23", "throughput": 331.9, "total_tokens": 19514944} {"current_steps": 15405, "total_steps": 40000, "loss": 0.0556, "lr": 0.20297714218969456, "epoch": 0.75269342584223, "percentage": 38.51, "elapsed_time": "16:20:01", "remaining_time": "1 day, 2:04:40", "throughput": 331.98, "total_tokens": 19521120} {"current_steps": 15410, "total_steps": 40000, "loss": 0.0387, "lr": 0.20292202936594497, "epoch": 0.7529377275059244, "percentage": 38.52, "elapsed_time": "16:20:04", "remaining_time": "1 day, 2:03:55", "throughput": 332.07, "total_tokens": 19527328} {"current_steps": 15415, "total_steps": 40000, "loss": 0.0564, "lr": 0.2028669083809534, "epoch": 0.7531820291696186, "percentage": 38.54, "elapsed_time": "16:20:07", "remaining_time": "1 day, 2:03:11", "throughput": 332.17, "total_tokens": 19533984} {"current_steps": 15420, "total_steps": 40000, "loss": 0.0569, "lr": 0.20281177924322016, "epoch": 0.753426330833313, "percentage": 38.55, "elapsed_time": "16:20:11", "remaining_time": "1 day, 2:02:26", "throughput": 332.26, "total_tokens": 19540480} {"current_steps": 15425, "total_steps": 40000, "loss": 0.0416, "lr": 0.2027566419612469, "epoch": 0.7536706324970073, "percentage": 38.56, "elapsed_time": "16:20:14", "remaining_time": "1 day, 2:01:42", "throughput": 332.35, "total_tokens": 19547232} {"current_steps": 15430, "total_steps": 40000, "loss": 0.0901, "lr": 0.20270149654353647, "epoch": 0.7539149341607017, "percentage": 38.57, "elapsed_time": "16:20:17", "remaining_time": "1 day, 2:00:57", "throughput": 332.44, "total_tokens": 19553216} {"current_steps": 15435, "total_steps": 40000, "loss": 0.0464, "lr": 0.202646342998593, "epoch": 0.7541592358243959, "percentage": 38.59, "elapsed_time": "16:20:20", "remaining_time": "1 day, 2:00:13", "throughput": 332.53, "total_tokens": 19559584} {"current_steps": 15440, "total_steps": 40000, "loss": 0.0664, "lr": 0.20259118133492185, "epoch": 0.7544035374880903, "percentage": 38.6, "elapsed_time": "16:20:23", "remaining_time": "1 day, 1:59:29", "throughput": 332.62, "total_tokens": 19565728} {"current_steps": 15445, "total_steps": 40000, "loss": 0.0856, "lr": 0.20253601156102966, "epoch": 0.7546478391517846, "percentage": 38.61, "elapsed_time": "16:20:26", "remaining_time": "1 day, 1:58:44", "throughput": 332.71, "total_tokens": 19572448} {"current_steps": 15450, "total_steps": 40000, "loss": 0.0657, "lr": 0.20248083368542422, "epoch": 0.754892140815479, "percentage": 38.62, "elapsed_time": "16:20:29", "remaining_time": "1 day, 1:58:00", "throughput": 332.8, "total_tokens": 19578464} {"current_steps": 15455, "total_steps": 40000, "loss": 0.066, "lr": 0.2024256477166147, "epoch": 0.7551364424791733, "percentage": 38.64, "elapsed_time": "16:20:32", "remaining_time": "1 day, 1:57:15", "throughput": 332.89, "total_tokens": 19584544} {"current_steps": 15460, "total_steps": 40000, "loss": 0.1118, "lr": 0.2023704536631115, "epoch": 0.7553807441428676, "percentage": 38.65, "elapsed_time": "16:20:35", "remaining_time": "1 day, 1:56:31", "throughput": 332.98, "total_tokens": 19590848} {"current_steps": 15465, "total_steps": 40000, "loss": 0.089, "lr": 0.20231525153342625, "epoch": 0.755625045806562, "percentage": 38.66, "elapsed_time": "16:20:38", "remaining_time": "1 day, 1:55:46", "throughput": 333.06, "total_tokens": 19596864} {"current_steps": 15470, "total_steps": 40000, "loss": 0.0604, "lr": 0.20226004133607173, "epoch": 0.7558693474702562, "percentage": 38.67, "elapsed_time": "16:20:41", "remaining_time": "1 day, 1:55:02", "throughput": 333.15, "total_tokens": 19603168} {"current_steps": 15475, "total_steps": 40000, "loss": 0.0642, "lr": 0.20220482307956214, "epoch": 0.7561136491339506, "percentage": 38.69, "elapsed_time": "16:20:44", "remaining_time": "1 day, 1:54:18", "throughput": 333.24, "total_tokens": 19609536} {"current_steps": 15480, "total_steps": 40000, "loss": 0.0533, "lr": 0.20214959677241276, "epoch": 0.7563579507976449, "percentage": 38.7, "elapsed_time": "16:20:48", "remaining_time": "1 day, 1:53:34", "throughput": 333.33, "total_tokens": 19615808} {"current_steps": 15485, "total_steps": 40000, "loss": 0.0568, "lr": 0.20209436242314022, "epoch": 0.7566022524613393, "percentage": 38.71, "elapsed_time": "16:20:51", "remaining_time": "1 day, 1:52:49", "throughput": 333.43, "total_tokens": 19622464} {"current_steps": 15490, "total_steps": 40000, "loss": 0.062, "lr": 0.2020391200402623, "epoch": 0.7568465541250335, "percentage": 38.73, "elapsed_time": "16:20:54", "remaining_time": "1 day, 1:52:05", "throughput": 333.51, "total_tokens": 19628320} {"current_steps": 15495, "total_steps": 40000, "loss": 0.0821, "lr": 0.2019838696322981, "epoch": 0.7570908557887279, "percentage": 38.74, "elapsed_time": "16:20:57", "remaining_time": "1 day, 1:51:21", "throughput": 333.6, "total_tokens": 19634624} {"current_steps": 15500, "total_steps": 40000, "loss": 0.0487, "lr": 0.20192861120776798, "epoch": 0.7573351574524223, "percentage": 38.75, "elapsed_time": "16:21:00", "remaining_time": "1 day, 1:50:37", "throughput": 333.68, "total_tokens": 19640352} {"current_steps": 15505, "total_steps": 40000, "loss": 0.0579, "lr": 0.20187334477519345, "epoch": 0.7575794591161166, "percentage": 38.76, "elapsed_time": "16:21:03", "remaining_time": "1 day, 1:49:52", "throughput": 333.77, "total_tokens": 19646688} {"current_steps": 15510, "total_steps": 40000, "loss": 0.0505, "lr": 0.20181807034309726, "epoch": 0.757823760779811, "percentage": 38.77, "elapsed_time": "16:21:06", "remaining_time": "1 day, 1:49:08", "throughput": 333.86, "total_tokens": 19653024} {"current_steps": 15515, "total_steps": 40000, "loss": 0.0485, "lr": 0.2017627879200034, "epoch": 0.7580680624435052, "percentage": 38.79, "elapsed_time": "16:21:09", "remaining_time": "1 day, 1:48:24", "throughput": 333.95, "total_tokens": 19659584} {"current_steps": 15520, "total_steps": 40000, "loss": 0.0504, "lr": 0.2017074975144372, "epoch": 0.7583123641071996, "percentage": 38.8, "elapsed_time": "16:21:12", "remaining_time": "1 day, 1:47:40", "throughput": 334.04, "total_tokens": 19665600} {"current_steps": 15525, "total_steps": 40000, "loss": 0.0852, "lr": 0.20165219913492508, "epoch": 0.7585566657708939, "percentage": 38.81, "elapsed_time": "16:21:15", "remaining_time": "1 day, 1:46:56", "throughput": 334.13, "total_tokens": 19671840} {"current_steps": 15530, "total_steps": 40000, "loss": 0.0468, "lr": 0.20159689278999468, "epoch": 0.7588009674345882, "percentage": 38.82, "elapsed_time": "16:21:18", "remaining_time": "1 day, 1:46:12", "throughput": 334.21, "total_tokens": 19677952} {"current_steps": 15535, "total_steps": 40000, "loss": 0.0512, "lr": 0.20154157848817508, "epoch": 0.7590452690982825, "percentage": 38.84, "elapsed_time": "16:21:21", "remaining_time": "1 day, 1:45:28", "throughput": 334.3, "total_tokens": 19684032} {"current_steps": 15540, "total_steps": 40000, "loss": 0.1091, "lr": 0.20148625623799632, "epoch": 0.7592895707619769, "percentage": 38.85, "elapsed_time": "16:21:24", "remaining_time": "1 day, 1:44:44", "throughput": 334.38, "total_tokens": 19689888} {"current_steps": 15545, "total_steps": 40000, "loss": 0.0709, "lr": 0.20143092604798984, "epoch": 0.7595338724256712, "percentage": 38.86, "elapsed_time": "16:21:27", "remaining_time": "1 day, 1:44:00", "throughput": 334.48, "total_tokens": 19696480} {"current_steps": 15550, "total_steps": 40000, "loss": 0.0686, "lr": 0.2013755879266883, "epoch": 0.7597781740893655, "percentage": 38.88, "elapsed_time": "16:21:30", "remaining_time": "1 day, 1:43:17", "throughput": 334.57, "total_tokens": 19703296} {"current_steps": 15555, "total_steps": 40000, "loss": 0.0804, "lr": 0.20132024188262543, "epoch": 0.7600224757530599, "percentage": 38.89, "elapsed_time": "16:21:33", "remaining_time": "1 day, 1:42:33", "throughput": 334.66, "total_tokens": 19709472} {"current_steps": 15560, "total_steps": 40000, "loss": 0.0641, "lr": 0.2012648879243363, "epoch": 0.7602667774167542, "percentage": 38.9, "elapsed_time": "16:21:36", "remaining_time": "1 day, 1:41:49", "throughput": 334.75, "total_tokens": 19715488} {"current_steps": 15565, "total_steps": 40000, "loss": 0.0614, "lr": 0.20120952606035725, "epoch": 0.7605110790804486, "percentage": 38.91, "elapsed_time": "16:21:40", "remaining_time": "1 day, 1:41:05", "throughput": 334.84, "total_tokens": 19722336} {"current_steps": 15570, "total_steps": 40000, "loss": 0.0786, "lr": 0.20115415629922576, "epoch": 0.7607553807441428, "percentage": 38.92, "elapsed_time": "16:21:43", "remaining_time": "1 day, 1:40:21", "throughput": 334.93, "total_tokens": 19728512} {"current_steps": 15575, "total_steps": 40000, "loss": 0.0676, "lr": 0.20109877864948048, "epoch": 0.7609996824078372, "percentage": 38.94, "elapsed_time": "16:21:46", "remaining_time": "1 day, 1:39:37", "throughput": 335.02, "total_tokens": 19735040} {"current_steps": 15580, "total_steps": 40000, "loss": 0.0525, "lr": 0.20104339311966138, "epoch": 0.7612439840715315, "percentage": 38.95, "elapsed_time": "16:21:49", "remaining_time": "1 day, 1:38:54", "throughput": 335.11, "total_tokens": 19741216} {"current_steps": 15585, "total_steps": 40000, "loss": 0.0566, "lr": 0.2009879997183097, "epoch": 0.7614882857352259, "percentage": 38.96, "elapsed_time": "16:21:52", "remaining_time": "1 day, 1:38:10", "throughput": 335.21, "total_tokens": 19748320} {"current_steps": 15590, "total_steps": 40000, "loss": 0.0532, "lr": 0.20093259845396763, "epoch": 0.7617325873989201, "percentage": 38.98, "elapsed_time": "16:21:55", "remaining_time": "1 day, 1:37:27", "throughput": 335.3, "total_tokens": 19754720} {"current_steps": 15595, "total_steps": 40000, "loss": 0.0659, "lr": 0.20087718933517884, "epoch": 0.7619768890626145, "percentage": 38.99, "elapsed_time": "16:21:58", "remaining_time": "1 day, 1:36:43", "throughput": 335.39, "total_tokens": 19760704} {"current_steps": 15600, "total_steps": 40000, "loss": 0.0913, "lr": 0.20082177237048807, "epoch": 0.7622211907263089, "percentage": 39.0, "elapsed_time": "16:22:01", "remaining_time": "1 day, 1:35:59", "throughput": 335.48, "total_tokens": 19766912} {"current_steps": 15600, "total_steps": 40000, "eval_loss": 0.06753074377775192, "epoch": 0.7622211907263089, "percentage": 39.0, "elapsed_time": "16:32:41", "remaining_time": "1 day, 1:52:41", "throughput": 331.87, "total_tokens": 19766912} {"current_steps": 15605, "total_steps": 40000, "loss": 0.0587, "lr": 0.20076634756844133, "epoch": 0.7624654923900032, "percentage": 39.01, "elapsed_time": "16:32:46", "remaining_time": "1 day, 1:51:59", "throughput": 331.96, "total_tokens": 19773504} {"current_steps": 15610, "total_steps": 40000, "loss": 0.0728, "lr": 0.20071091493758586, "epoch": 0.7627097940536975, "percentage": 39.02, "elapsed_time": "16:32:49", "remaining_time": "1 day, 1:51:15", "throughput": 332.04, "total_tokens": 19779648} {"current_steps": 15615, "total_steps": 40000, "loss": 0.0605, "lr": 0.20065547448647003, "epoch": 0.7629540957173918, "percentage": 39.04, "elapsed_time": "16:32:52", "remaining_time": "1 day, 1:50:31", "throughput": 332.13, "total_tokens": 19786080} {"current_steps": 15620, "total_steps": 40000, "loss": 0.0768, "lr": 0.20060002622364348, "epoch": 0.7631983973810862, "percentage": 39.05, "elapsed_time": "16:32:55", "remaining_time": "1 day, 1:49:47", "throughput": 332.23, "total_tokens": 19792736} {"current_steps": 15625, "total_steps": 40000, "loss": 0.0443, "lr": 0.20054457015765695, "epoch": 0.7634426990447805, "percentage": 39.06, "elapsed_time": "16:32:58", "remaining_time": "1 day, 1:49:03", "throughput": 332.31, "total_tokens": 19798816} {"current_steps": 15630, "total_steps": 40000, "loss": 0.0592, "lr": 0.20048910629706254, "epoch": 0.7636870007084748, "percentage": 39.07, "elapsed_time": "16:33:02", "remaining_time": "1 day, 1:48:19", "throughput": 332.4, "total_tokens": 19804992} {"current_steps": 15635, "total_steps": 40000, "loss": 0.0744, "lr": 0.20043363465041347, "epoch": 0.7639313023721691, "percentage": 39.09, "elapsed_time": "16:33:05", "remaining_time": "1 day, 1:47:35", "throughput": 332.49, "total_tokens": 19811232} {"current_steps": 15640, "total_steps": 40000, "loss": 0.0524, "lr": 0.2003781552262641, "epoch": 0.7641756040358635, "percentage": 39.1, "elapsed_time": "16:33:08", "remaining_time": "1 day, 1:46:51", "throughput": 332.57, "total_tokens": 19817504} {"current_steps": 15645, "total_steps": 40000, "loss": 0.0571, "lr": 0.20032266803317014, "epoch": 0.7644199056995579, "percentage": 39.11, "elapsed_time": "16:33:11", "remaining_time": "1 day, 1:46:07", "throughput": 332.66, "total_tokens": 19823552} {"current_steps": 15650, "total_steps": 40000, "loss": 0.1094, "lr": 0.2002671730796884, "epoch": 0.7646642073632521, "percentage": 39.12, "elapsed_time": "16:33:14", "remaining_time": "1 day, 1:45:23", "throughput": 332.74, "total_tokens": 19829472} {"current_steps": 15655, "total_steps": 40000, "loss": 0.0523, "lr": 0.20021167037437684, "epoch": 0.7649085090269465, "percentage": 39.14, "elapsed_time": "16:33:17", "remaining_time": "1 day, 1:44:39", "throughput": 332.83, "total_tokens": 19835872} {"current_steps": 15660, "total_steps": 40000, "loss": 0.0461, "lr": 0.20015615992579472, "epoch": 0.7651528106906408, "percentage": 39.15, "elapsed_time": "16:33:20", "remaining_time": "1 day, 1:43:55", "throughput": 332.92, "total_tokens": 19842080} {"current_steps": 15665, "total_steps": 40000, "loss": 0.0517, "lr": 0.20010064174250244, "epoch": 0.7653971123543352, "percentage": 39.16, "elapsed_time": "16:33:23", "remaining_time": "1 day, 1:43:11", "throughput": 333.01, "total_tokens": 19848352} {"current_steps": 15670, "total_steps": 40000, "loss": 0.1013, "lr": 0.2000451158330616, "epoch": 0.7656414140180294, "percentage": 39.17, "elapsed_time": "16:33:26", "remaining_time": "1 day, 1:42:27", "throughput": 333.09, "total_tokens": 19854528} {"current_steps": 15675, "total_steps": 40000, "loss": 0.0726, "lr": 0.199989582206035, "epoch": 0.7658857156817238, "percentage": 39.19, "elapsed_time": "16:33:29", "remaining_time": "1 day, 1:41:44", "throughput": 333.18, "total_tokens": 19860544} {"current_steps": 15680, "total_steps": 40000, "loss": 0.0733, "lr": 0.1999340408699866, "epoch": 0.7661300173454181, "percentage": 39.2, "elapsed_time": "16:33:32", "remaining_time": "1 day, 1:41:00", "throughput": 333.26, "total_tokens": 19866528} {"current_steps": 15685, "total_steps": 40000, "loss": 0.0989, "lr": 0.19987849183348155, "epoch": 0.7663743190091125, "percentage": 39.21, "elapsed_time": "16:33:35", "remaining_time": "1 day, 1:40:16", "throughput": 333.36, "total_tokens": 19873792} {"current_steps": 15690, "total_steps": 40000, "loss": 0.0652, "lr": 0.19982293510508628, "epoch": 0.7666186206728067, "percentage": 39.23, "elapsed_time": "16:33:38", "remaining_time": "1 day, 1:39:33", "throughput": 333.45, "total_tokens": 19879968} {"current_steps": 15695, "total_steps": 40000, "loss": 0.0833, "lr": 0.19976737069336833, "epoch": 0.7668629223365011, "percentage": 39.24, "elapsed_time": "16:33:41", "remaining_time": "1 day, 1:38:49", "throughput": 333.54, "total_tokens": 19886464} {"current_steps": 15700, "total_steps": 40000, "loss": 0.0547, "lr": 0.1997117986068964, "epoch": 0.7671072240001955, "percentage": 39.25, "elapsed_time": "16:33:45", "remaining_time": "1 day, 1:38:05", "throughput": 333.63, "total_tokens": 19892640} {"current_steps": 15705, "total_steps": 40000, "loss": 0.0569, "lr": 0.19965621885424037, "epoch": 0.7673515256638898, "percentage": 39.26, "elapsed_time": "16:33:48", "remaining_time": "1 day, 1:37:22", "throughput": 333.72, "total_tokens": 19898944} {"current_steps": 15710, "total_steps": 40000, "loss": 0.0797, "lr": 0.19960063144397142, "epoch": 0.7675958273275841, "percentage": 39.27, "elapsed_time": "16:33:51", "remaining_time": "1 day, 1:36:38", "throughput": 333.8, "total_tokens": 19904992} {"current_steps": 15715, "total_steps": 40000, "loss": 0.0562, "lr": 0.19954503638466176, "epoch": 0.7678401289912784, "percentage": 39.29, "elapsed_time": "16:33:54", "remaining_time": "1 day, 1:35:55", "throughput": 333.9, "total_tokens": 19911840} {"current_steps": 15720, "total_steps": 40000, "loss": 0.0662, "lr": 0.1994894336848848, "epoch": 0.7680844306549728, "percentage": 39.3, "elapsed_time": "16:33:57", "remaining_time": "1 day, 1:35:11", "throughput": 333.99, "total_tokens": 19918272} {"current_steps": 15725, "total_steps": 40000, "loss": 0.0564, "lr": 0.1994338233532153, "epoch": 0.768328732318667, "percentage": 39.31, "elapsed_time": "16:34:00", "remaining_time": "1 day, 1:34:28", "throughput": 334.07, "total_tokens": 19924160} {"current_steps": 15730, "total_steps": 40000, "loss": 0.0644, "lr": 0.19937820539822904, "epoch": 0.7685730339823614, "percentage": 39.32, "elapsed_time": "16:34:03", "remaining_time": "1 day, 1:33:44", "throughput": 334.16, "total_tokens": 19930464} {"current_steps": 15735, "total_steps": 40000, "loss": 0.05, "lr": 0.199322579828503, "epoch": 0.7688173356460557, "percentage": 39.34, "elapsed_time": "16:34:06", "remaining_time": "1 day, 1:33:01", "throughput": 334.25, "total_tokens": 19936544} {"current_steps": 15740, "total_steps": 40000, "loss": 0.073, "lr": 0.19926694665261527, "epoch": 0.7690616373097501, "percentage": 39.35, "elapsed_time": "16:34:09", "remaining_time": "1 day, 1:32:17", "throughput": 334.34, "total_tokens": 19943264} {"current_steps": 15745, "total_steps": 40000, "loss": 0.0545, "lr": 0.19921130587914526, "epoch": 0.7693059389734445, "percentage": 39.36, "elapsed_time": "16:34:12", "remaining_time": "1 day, 1:31:34", "throughput": 334.43, "total_tokens": 19949600} {"current_steps": 15750, "total_steps": 40000, "loss": 0.0431, "lr": 0.19915565751667344, "epoch": 0.7695502406371387, "percentage": 39.38, "elapsed_time": "16:34:15", "remaining_time": "1 day, 1:30:51", "throughput": 334.52, "total_tokens": 19956032} {"current_steps": 15755, "total_steps": 40000, "loss": 0.1037, "lr": 0.19910000157378152, "epoch": 0.7697945423008331, "percentage": 39.39, "elapsed_time": "16:34:19", "remaining_time": "1 day, 1:30:07", "throughput": 334.61, "total_tokens": 19962592} {"current_steps": 15760, "total_steps": 40000, "loss": 0.0719, "lr": 0.1990443380590523, "epoch": 0.7700388439645274, "percentage": 39.4, "elapsed_time": "16:34:22", "remaining_time": "1 day, 1:29:24", "throughput": 334.7, "total_tokens": 19968672} {"current_steps": 15765, "total_steps": 40000, "loss": 0.0535, "lr": 0.19898866698106984, "epoch": 0.7702831456282218, "percentage": 39.41, "elapsed_time": "16:34:25", "remaining_time": "1 day, 1:28:41", "throughput": 334.78, "total_tokens": 19974528} {"current_steps": 15770, "total_steps": 40000, "loss": 0.0627, "lr": 0.19893298834841933, "epoch": 0.770527447291916, "percentage": 39.42, "elapsed_time": "16:34:28", "remaining_time": "1 day, 1:27:57", "throughput": 334.87, "total_tokens": 19980928} {"current_steps": 15775, "total_steps": 40000, "loss": 0.0458, "lr": 0.19887730216968705, "epoch": 0.7707717489556104, "percentage": 39.44, "elapsed_time": "16:34:31", "remaining_time": "1 day, 1:27:14", "throughput": 334.96, "total_tokens": 19987296} {"current_steps": 15780, "total_steps": 40000, "loss": 0.0649, "lr": 0.19882160845346053, "epoch": 0.7710160506193047, "percentage": 39.45, "elapsed_time": "16:34:34", "remaining_time": "1 day, 1:26:31", "throughput": 335.04, "total_tokens": 19993408} {"current_steps": 15785, "total_steps": 40000, "loss": 0.0844, "lr": 0.1987659072083285, "epoch": 0.771260352282999, "percentage": 39.46, "elapsed_time": "16:34:37", "remaining_time": "1 day, 1:25:48", "throughput": 335.13, "total_tokens": 19999616} {"current_steps": 15790, "total_steps": 40000, "loss": 0.0858, "lr": 0.1987101984428807, "epoch": 0.7715046539466934, "percentage": 39.48, "elapsed_time": "16:34:40", "remaining_time": "1 day, 1:25:04", "throughput": 335.21, "total_tokens": 20005760} {"current_steps": 15795, "total_steps": 40000, "loss": 0.0885, "lr": 0.19865448216570822, "epoch": 0.7717489556103877, "percentage": 39.49, "elapsed_time": "16:34:43", "remaining_time": "1 day, 1:24:21", "throughput": 335.3, "total_tokens": 20012096} {"current_steps": 15800, "total_steps": 40000, "loss": 0.0396, "lr": 0.19859875838540317, "epoch": 0.7719932572740821, "percentage": 39.5, "elapsed_time": "16:34:46", "remaining_time": "1 day, 1:23:38", "throughput": 335.39, "total_tokens": 20018240} {"current_steps": 15800, "total_steps": 40000, "eval_loss": 0.0712004154920578, "epoch": 0.7719932572740821, "percentage": 39.5, "elapsed_time": "16:45:26", "remaining_time": "1 day, 1:39:59", "throughput": 331.83, "total_tokens": 20018240} {"current_steps": 15805, "total_steps": 40000, "loss": 0.0886, "lr": 0.1985430271105588, "epoch": 0.7722375589377763, "percentage": 39.51, "elapsed_time": "16:45:30", "remaining_time": "1 day, 1:39:16", "throughput": 331.9, "total_tokens": 20023904} {"current_steps": 15810, "total_steps": 40000, "loss": 0.0425, "lr": 0.19848728834976961, "epoch": 0.7724818606014707, "percentage": 39.52, "elapsed_time": "16:45:33", "remaining_time": "1 day, 1:38:33", "throughput": 331.99, "total_tokens": 20029984} {"current_steps": 15815, "total_steps": 40000, "loss": 0.0688, "lr": 0.19843154211163128, "epoch": 0.772726162265165, "percentage": 39.54, "elapsed_time": "16:45:36", "remaining_time": "1 day, 1:37:49", "throughput": 332.07, "total_tokens": 20035776} {"current_steps": 15820, "total_steps": 40000, "loss": 0.0612, "lr": 0.1983757884047405, "epoch": 0.7729704639288594, "percentage": 39.55, "elapsed_time": "16:45:39", "remaining_time": "1 day, 1:37:05", "throughput": 332.16, "total_tokens": 20042240} {"current_steps": 15825, "total_steps": 40000, "loss": 0.0531, "lr": 0.1983200272376952, "epoch": 0.7732147655925536, "percentage": 39.56, "elapsed_time": "16:45:42", "remaining_time": "1 day, 1:36:22", "throughput": 332.25, "total_tokens": 20048672} {"current_steps": 15830, "total_steps": 40000, "loss": 0.0801, "lr": 0.1982642586190945, "epoch": 0.773459067256248, "percentage": 39.57, "elapsed_time": "16:45:45", "remaining_time": "1 day, 1:35:38", "throughput": 332.33, "total_tokens": 20054688} {"current_steps": 15835, "total_steps": 40000, "loss": 0.0608, "lr": 0.1982084825575386, "epoch": 0.7737033689199423, "percentage": 39.59, "elapsed_time": "16:45:48", "remaining_time": "1 day, 1:34:55", "throughput": 332.42, "total_tokens": 20061472} {"current_steps": 15840, "total_steps": 40000, "loss": 0.0667, "lr": 0.19815269906162883, "epoch": 0.7739476705836367, "percentage": 39.6, "elapsed_time": "16:45:52", "remaining_time": "1 day, 1:34:12", "throughput": 332.51, "total_tokens": 20067776} {"current_steps": 15845, "total_steps": 40000, "loss": 0.0751, "lr": 0.19809690813996775, "epoch": 0.774191972247331, "percentage": 39.61, "elapsed_time": "16:45:55", "remaining_time": "1 day, 1:33:28", "throughput": 332.6, "total_tokens": 20073952} {"current_steps": 15850, "total_steps": 40000, "loss": 0.0656, "lr": 0.19804110980115905, "epoch": 0.7744362739110253, "percentage": 39.62, "elapsed_time": "16:45:58", "remaining_time": "1 day, 1:32:45", "throughput": 332.68, "total_tokens": 20080224} {"current_steps": 15855, "total_steps": 40000, "loss": 0.0649, "lr": 0.19798530405380746, "epoch": 0.7746805755747197, "percentage": 39.64, "elapsed_time": "16:46:01", "remaining_time": "1 day, 1:32:01", "throughput": 332.77, "total_tokens": 20086304} {"current_steps": 15860, "total_steps": 40000, "loss": 0.0738, "lr": 0.19792949090651893, "epoch": 0.774924877238414, "percentage": 39.65, "elapsed_time": "16:46:04", "remaining_time": "1 day, 1:31:18", "throughput": 332.86, "total_tokens": 20093152} {"current_steps": 15865, "total_steps": 40000, "loss": 0.0489, "lr": 0.19787367036790066, "epoch": 0.7751691789021083, "percentage": 39.66, "elapsed_time": "16:46:07", "remaining_time": "1 day, 1:30:35", "throughput": 332.96, "total_tokens": 20099808} {"current_steps": 15870, "total_steps": 40000, "loss": 0.0491, "lr": 0.19781784244656075, "epoch": 0.7754134805658026, "percentage": 39.67, "elapsed_time": "16:46:10", "remaining_time": "1 day, 1:29:52", "throughput": 333.04, "total_tokens": 20105664} {"current_steps": 15875, "total_steps": 40000, "loss": 0.0589, "lr": 0.19776200715110864, "epoch": 0.775657782229497, "percentage": 39.69, "elapsed_time": "16:46:13", "remaining_time": "1 day, 1:29:08", "throughput": 333.12, "total_tokens": 20111744} {"current_steps": 15880, "total_steps": 40000, "loss": 0.1086, "lr": 0.1977061644901548, "epoch": 0.7759020838931913, "percentage": 39.7, "elapsed_time": "16:46:16", "remaining_time": "1 day, 1:28:25", "throughput": 333.21, "total_tokens": 20118016} {"current_steps": 15885, "total_steps": 40000, "loss": 0.0651, "lr": 0.1976503144723109, "epoch": 0.7761463855568856, "percentage": 39.71, "elapsed_time": "16:46:19", "remaining_time": "1 day, 1:27:42", "throughput": 333.29, "total_tokens": 20123904} {"current_steps": 15890, "total_steps": 40000, "loss": 0.0719, "lr": 0.19759445710618967, "epoch": 0.77639068722058, "percentage": 39.73, "elapsed_time": "16:46:22", "remaining_time": "1 day, 1:26:59", "throughput": 333.37, "total_tokens": 20130016} {"current_steps": 15895, "total_steps": 40000, "loss": 0.0708, "lr": 0.19753859240040508, "epoch": 0.7766349888842743, "percentage": 39.74, "elapsed_time": "16:46:25", "remaining_time": "1 day, 1:26:15", "throughput": 333.46, "total_tokens": 20136032} {"current_steps": 15900, "total_steps": 40000, "loss": 0.0689, "lr": 0.1974827203635721, "epoch": 0.7768792905479687, "percentage": 39.75, "elapsed_time": "16:46:28", "remaining_time": "1 day, 1:25:32", "throughput": 333.55, "total_tokens": 20142688} {"current_steps": 15905, "total_steps": 40000, "loss": 0.0555, "lr": 0.19742684100430694, "epoch": 0.7771235922116629, "percentage": 39.76, "elapsed_time": "16:46:32", "remaining_time": "1 day, 1:24:49", "throughput": 333.64, "total_tokens": 20149120} {"current_steps": 15910, "total_steps": 40000, "loss": 0.0629, "lr": 0.19737095433122692, "epoch": 0.7773678938753573, "percentage": 39.77, "elapsed_time": "16:46:35", "remaining_time": "1 day, 1:24:06", "throughput": 333.73, "total_tokens": 20155456} {"current_steps": 15915, "total_steps": 40000, "loss": 0.0858, "lr": 0.19731506035295046, "epoch": 0.7776121955390516, "percentage": 39.79, "elapsed_time": "16:46:38", "remaining_time": "1 day, 1:23:23", "throughput": 333.82, "total_tokens": 20161952} {"current_steps": 15920, "total_steps": 40000, "loss": 0.0626, "lr": 0.19725915907809702, "epoch": 0.777856497202746, "percentage": 39.8, "elapsed_time": "16:46:41", "remaining_time": "1 day, 1:22:40", "throughput": 333.91, "total_tokens": 20168352} {"current_steps": 15925, "total_steps": 40000, "loss": 0.0745, "lr": 0.1972032505152874, "epoch": 0.7781007988664402, "percentage": 39.81, "elapsed_time": "16:46:44", "remaining_time": "1 day, 1:21:57", "throughput": 334.0, "total_tokens": 20175104} {"current_steps": 15930, "total_steps": 40000, "loss": 0.0577, "lr": 0.19714733467314338, "epoch": 0.7783451005301346, "percentage": 39.83, "elapsed_time": "16:46:47", "remaining_time": "1 day, 1:21:15", "throughput": 334.09, "total_tokens": 20181600} {"current_steps": 15935, "total_steps": 40000, "loss": 0.065, "lr": 0.19709141156028784, "epoch": 0.778589402193829, "percentage": 39.84, "elapsed_time": "16:46:50", "remaining_time": "1 day, 1:20:31", "throughput": 334.17, "total_tokens": 20187264} {"current_steps": 15940, "total_steps": 40000, "loss": 0.0721, "lr": 0.1970354811853448, "epoch": 0.7788337038575233, "percentage": 39.85, "elapsed_time": "16:46:53", "remaining_time": "1 day, 1:19:48", "throughput": 334.25, "total_tokens": 20193184} {"current_steps": 15945, "total_steps": 40000, "loss": 0.0692, "lr": 0.19697954355693953, "epoch": 0.7790780055212176, "percentage": 39.86, "elapsed_time": "16:46:56", "remaining_time": "1 day, 1:19:06", "throughput": 334.33, "total_tokens": 20199392} {"current_steps": 15950, "total_steps": 40000, "loss": 0.0543, "lr": 0.19692359868369827, "epoch": 0.7793223071849119, "percentage": 39.88, "elapsed_time": "16:46:59", "remaining_time": "1 day, 1:18:23", "throughput": 334.44, "total_tokens": 20206656} {"current_steps": 15955, "total_steps": 40000, "loss": 0.0638, "lr": 0.1968676465742484, "epoch": 0.7795666088486063, "percentage": 39.89, "elapsed_time": "16:47:03", "remaining_time": "1 day, 1:17:40", "throughput": 334.52, "total_tokens": 20212864} {"current_steps": 15960, "total_steps": 40000, "loss": 0.0715, "lr": 0.19681168723721845, "epoch": 0.7798109105123006, "percentage": 39.9, "elapsed_time": "16:47:06", "remaining_time": "1 day, 1:16:57", "throughput": 334.61, "total_tokens": 20219008} {"current_steps": 15965, "total_steps": 40000, "loss": 0.0529, "lr": 0.19675572068123803, "epoch": 0.7800552121759949, "percentage": 39.91, "elapsed_time": "16:47:09", "remaining_time": "1 day, 1:16:14", "throughput": 334.7, "total_tokens": 20225536} {"current_steps": 15970, "total_steps": 40000, "loss": 0.0803, "lr": 0.19669974691493794, "epoch": 0.7802995138396892, "percentage": 39.92, "elapsed_time": "16:47:12", "remaining_time": "1 day, 1:15:32", "throughput": 334.79, "total_tokens": 20232064} {"current_steps": 15975, "total_steps": 40000, "loss": 0.068, "lr": 0.19664376594695002, "epoch": 0.7805438155033836, "percentage": 39.94, "elapsed_time": "16:47:15", "remaining_time": "1 day, 1:14:49", "throughput": 334.87, "total_tokens": 20238080} {"current_steps": 15980, "total_steps": 40000, "loss": 0.0526, "lr": 0.19658777778590722, "epoch": 0.7807881171670779, "percentage": 39.95, "elapsed_time": "16:47:18", "remaining_time": "1 day, 1:14:06", "throughput": 334.96, "total_tokens": 20244128} {"current_steps": 15985, "total_steps": 40000, "loss": 0.0504, "lr": 0.19653178244044364, "epoch": 0.7810324188307722, "percentage": 39.96, "elapsed_time": "16:47:21", "remaining_time": "1 day, 1:13:23", "throughput": 335.04, "total_tokens": 20250208} {"current_steps": 15990, "total_steps": 40000, "loss": 0.0443, "lr": 0.19647577991919443, "epoch": 0.7812767204944666, "percentage": 39.98, "elapsed_time": "16:47:24", "remaining_time": "1 day, 1:12:41", "throughput": 335.13, "total_tokens": 20256768} {"current_steps": 15995, "total_steps": 40000, "loss": 0.0623, "lr": 0.1964197702307959, "epoch": 0.7815210221581609, "percentage": 39.99, "elapsed_time": "16:47:27", "remaining_time": "1 day, 1:11:58", "throughput": 335.22, "total_tokens": 20263040} {"current_steps": 16000, "total_steps": 40000, "loss": 0.0567, "lr": 0.19636375338388545, "epoch": 0.7817653238218553, "percentage": 40.0, "elapsed_time": "16:47:30", "remaining_time": "1 day, 1:11:15", "throughput": 335.31, "total_tokens": 20269632} {"current_steps": 16000, "total_steps": 40000, "eval_loss": 0.06630679965019226, "epoch": 0.7817653238218553, "percentage": 40.0, "elapsed_time": "16:58:10", "remaining_time": "1 day, 1:27:16", "throughput": 331.79, "total_tokens": 20269632} {"current_steps": 16005, "total_steps": 40000, "loss": 0.0629, "lr": 0.1963077293871016, "epoch": 0.7820096254855495, "percentage": 40.01, "elapsed_time": "16:58:14", "remaining_time": "1 day, 1:26:34", "throughput": 331.88, "total_tokens": 20275840} {"current_steps": 16010, "total_steps": 40000, "loss": 0.0465, "lr": 0.19625169824908395, "epoch": 0.7822539271492439, "percentage": 40.02, "elapsed_time": "16:58:17", "remaining_time": "1 day, 1:25:51", "throughput": 331.96, "total_tokens": 20282080} {"current_steps": 16015, "total_steps": 40000, "loss": 0.072, "lr": 0.19619565997847319, "epoch": 0.7824982288129382, "percentage": 40.04, "elapsed_time": "16:58:20", "remaining_time": "1 day, 1:25:08", "throughput": 332.04, "total_tokens": 20288064} {"current_steps": 16020, "total_steps": 40000, "loss": 0.07, "lr": 0.19613961458391113, "epoch": 0.7827425304766326, "percentage": 40.05, "elapsed_time": "16:58:23", "remaining_time": "1 day, 1:24:25", "throughput": 332.13, "total_tokens": 20294752} {"current_steps": 16025, "total_steps": 40000, "loss": 0.0706, "lr": 0.19608356207404065, "epoch": 0.7829868321403268, "percentage": 40.06, "elapsed_time": "16:58:27", "remaining_time": "1 day, 1:23:42", "throughput": 332.22, "total_tokens": 20300992} {"current_steps": 16030, "total_steps": 40000, "loss": 0.0422, "lr": 0.1960275024575058, "epoch": 0.7832311338040212, "percentage": 40.08, "elapsed_time": "16:58:30", "remaining_time": "1 day, 1:22:59", "throughput": 332.31, "total_tokens": 20307520} {"current_steps": 16035, "total_steps": 40000, "loss": 0.0748, "lr": 0.19597143574295164, "epoch": 0.7834754354677156, "percentage": 40.09, "elapsed_time": "16:58:33", "remaining_time": "1 day, 1:22:16", "throughput": 332.39, "total_tokens": 20313664} {"current_steps": 16040, "total_steps": 40000, "loss": 0.0737, "lr": 0.1959153619390244, "epoch": 0.7837197371314099, "percentage": 40.1, "elapsed_time": "16:58:36", "remaining_time": "1 day, 1:21:33", "throughput": 332.48, "total_tokens": 20320192} {"current_steps": 16045, "total_steps": 40000, "loss": 0.0686, "lr": 0.1958592810543713, "epoch": 0.7839640387951042, "percentage": 40.11, "elapsed_time": "16:58:39", "remaining_time": "1 day, 1:20:50", "throughput": 332.57, "total_tokens": 20326432} {"current_steps": 16050, "total_steps": 40000, "loss": 0.0664, "lr": 0.19580319309764077, "epoch": 0.7842083404587985, "percentage": 40.12, "elapsed_time": "16:58:42", "remaining_time": "1 day, 1:20:07", "throughput": 332.66, "total_tokens": 20332800} {"current_steps": 16055, "total_steps": 40000, "loss": 0.0721, "lr": 0.1957470980774823, "epoch": 0.7844526421224929, "percentage": 40.14, "elapsed_time": "16:58:45", "remaining_time": "1 day, 1:19:25", "throughput": 332.75, "total_tokens": 20339680} {"current_steps": 16060, "total_steps": 40000, "loss": 0.0558, "lr": 0.19569099600254639, "epoch": 0.7846969437861872, "percentage": 40.15, "elapsed_time": "16:58:48", "remaining_time": "1 day, 1:18:42", "throughput": 332.83, "total_tokens": 20345792} {"current_steps": 16065, "total_steps": 40000, "loss": 0.082, "lr": 0.1956348868814847, "epoch": 0.7849412454498815, "percentage": 40.16, "elapsed_time": "16:58:51", "remaining_time": "1 day, 1:17:59", "throughput": 332.93, "total_tokens": 20352416} {"current_steps": 16070, "total_steps": 40000, "loss": 0.0771, "lr": 0.19557877072295, "epoch": 0.7851855471135758, "percentage": 40.17, "elapsed_time": "16:58:55", "remaining_time": "1 day, 1:17:16", "throughput": 333.02, "total_tokens": 20358944} {"current_steps": 16075, "total_steps": 40000, "loss": 0.0745, "lr": 0.19552264753559603, "epoch": 0.7854298487772702, "percentage": 40.19, "elapsed_time": "16:58:58", "remaining_time": "1 day, 1:16:33", "throughput": 333.09, "total_tokens": 20364576} {"current_steps": 16080, "total_steps": 40000, "loss": 0.0364, "lr": 0.19546651732807774, "epoch": 0.7856741504409646, "percentage": 40.2, "elapsed_time": "16:59:01", "remaining_time": "1 day, 1:15:51", "throughput": 333.18, "total_tokens": 20370752} {"current_steps": 16085, "total_steps": 40000, "loss": 0.0716, "lr": 0.19541038010905112, "epoch": 0.7859184521046588, "percentage": 40.21, "elapsed_time": "16:59:04", "remaining_time": "1 day, 1:15:08", "throughput": 333.27, "total_tokens": 20377248} {"current_steps": 16090, "total_steps": 40000, "loss": 0.0501, "lr": 0.19535423588717324, "epoch": 0.7861627537683532, "percentage": 40.23, "elapsed_time": "16:59:07", "remaining_time": "1 day, 1:14:25", "throughput": 333.35, "total_tokens": 20383200} {"current_steps": 16095, "total_steps": 40000, "loss": 0.0578, "lr": 0.19529808467110224, "epoch": 0.7864070554320475, "percentage": 40.24, "elapsed_time": "16:59:10", "remaining_time": "1 day, 1:13:43", "throughput": 333.44, "total_tokens": 20390048} {"current_steps": 16100, "total_steps": 40000, "loss": 0.0826, "lr": 0.19524192646949734, "epoch": 0.7866513570957419, "percentage": 40.25, "elapsed_time": "16:59:13", "remaining_time": "1 day, 1:13:00", "throughput": 333.53, "total_tokens": 20396800} {"current_steps": 16105, "total_steps": 40000, "loss": 0.0806, "lr": 0.19518576129101878, "epoch": 0.7868956587594361, "percentage": 40.26, "elapsed_time": "16:59:16", "remaining_time": "1 day, 1:12:18", "throughput": 333.62, "total_tokens": 20403040} {"current_steps": 16110, "total_steps": 40000, "loss": 0.0596, "lr": 0.19512958914432804, "epoch": 0.7871399604231305, "percentage": 40.27, "elapsed_time": "16:59:19", "remaining_time": "1 day, 1:11:35", "throughput": 333.7, "total_tokens": 20409248} {"current_steps": 16115, "total_steps": 40000, "loss": 0.0688, "lr": 0.1950734100380875, "epoch": 0.7873842620868248, "percentage": 40.29, "elapsed_time": "16:59:22", "remaining_time": "1 day, 1:10:52", "throughput": 333.78, "total_tokens": 20414944} {"current_steps": 16120, "total_steps": 40000, "loss": 0.0598, "lr": 0.19501722398096066, "epoch": 0.7876285637505192, "percentage": 40.3, "elapsed_time": "16:59:25", "remaining_time": "1 day, 1:10:10", "throughput": 333.86, "total_tokens": 20421056} {"current_steps": 16125, "total_steps": 40000, "loss": 0.0732, "lr": 0.1949610309816122, "epoch": 0.7878728654142134, "percentage": 40.31, "elapsed_time": "16:59:28", "remaining_time": "1 day, 1:09:27", "throughput": 333.95, "total_tokens": 20427168} {"current_steps": 16130, "total_steps": 40000, "loss": 0.0582, "lr": 0.1949048310487078, "epoch": 0.7881171670779078, "percentage": 40.33, "elapsed_time": "16:59:31", "remaining_time": "1 day, 1:08:45", "throughput": 334.04, "total_tokens": 20433632} {"current_steps": 16135, "total_steps": 40000, "loss": 0.0775, "lr": 0.19484862419091406, "epoch": 0.7883614687416022, "percentage": 40.34, "elapsed_time": "16:59:35", "remaining_time": "1 day, 1:08:02", "throughput": 334.12, "total_tokens": 20439904} {"current_steps": 16140, "total_steps": 40000, "loss": 0.0484, "lr": 0.19479241041689893, "epoch": 0.7886057704052964, "percentage": 40.35, "elapsed_time": "16:59:38", "remaining_time": "1 day, 1:07:20", "throughput": 334.21, "total_tokens": 20446304} {"current_steps": 16145, "total_steps": 40000, "loss": 0.0501, "lr": 0.19473618973533116, "epoch": 0.7888500720689908, "percentage": 40.36, "elapsed_time": "16:59:41", "remaining_time": "1 day, 1:06:38", "throughput": 334.3, "total_tokens": 20452640} {"current_steps": 16150, "total_steps": 40000, "loss": 0.0841, "lr": 0.19467996215488076, "epoch": 0.7890943737326851, "percentage": 40.38, "elapsed_time": "16:59:44", "remaining_time": "1 day, 1:05:55", "throughput": 334.38, "total_tokens": 20458848} {"current_steps": 16155, "total_steps": 40000, "loss": 0.0537, "lr": 0.1946237276842187, "epoch": 0.7893386753963795, "percentage": 40.39, "elapsed_time": "16:59:47", "remaining_time": "1 day, 1:05:13", "throughput": 334.47, "total_tokens": 20465472} {"current_steps": 16160, "total_steps": 40000, "loss": 0.0534, "lr": 0.19456748633201712, "epoch": 0.7895829770600737, "percentage": 40.4, "elapsed_time": "16:59:50", "remaining_time": "1 day, 1:04:31", "throughput": 334.56, "total_tokens": 20472192} {"current_steps": 16165, "total_steps": 40000, "loss": 0.0581, "lr": 0.194511238106949, "epoch": 0.7898272787237681, "percentage": 40.41, "elapsed_time": "16:59:53", "remaining_time": "1 day, 1:03:48", "throughput": 334.65, "total_tokens": 20478208} {"current_steps": 16170, "total_steps": 40000, "loss": 0.0817, "lr": 0.19445498301768863, "epoch": 0.7900715803874624, "percentage": 40.42, "elapsed_time": "16:59:56", "remaining_time": "1 day, 1:03:06", "throughput": 334.73, "total_tokens": 20484544} {"current_steps": 16175, "total_steps": 40000, "loss": 0.0432, "lr": 0.19439872107291126, "epoch": 0.7903158820511568, "percentage": 40.44, "elapsed_time": "16:59:59", "remaining_time": "1 day, 1:02:24", "throughput": 334.82, "total_tokens": 20490944} {"current_steps": 16180, "total_steps": 40000, "loss": 0.0645, "lr": 0.1943424522812931, "epoch": 0.7905601837148512, "percentage": 40.45, "elapsed_time": "17:00:02", "remaining_time": "1 day, 1:01:42", "throughput": 334.9, "total_tokens": 20496928} {"current_steps": 16185, "total_steps": 40000, "loss": 0.0546, "lr": 0.19428617665151157, "epoch": 0.7908044853785454, "percentage": 40.46, "elapsed_time": "17:00:06", "remaining_time": "1 day, 1:01:00", "throughput": 334.99, "total_tokens": 20503552} {"current_steps": 16190, "total_steps": 40000, "loss": 0.0453, "lr": 0.19422989419224507, "epoch": 0.7910487870422398, "percentage": 40.48, "elapsed_time": "17:00:09", "remaining_time": "1 day, 1:00:17", "throughput": 335.08, "total_tokens": 20510112} {"current_steps": 16195, "total_steps": 40000, "loss": 0.0672, "lr": 0.19417360491217303, "epoch": 0.7912930887059341, "percentage": 40.49, "elapsed_time": "17:00:12", "remaining_time": "1 day, 0:59:35", "throughput": 335.17, "total_tokens": 20516736} {"current_steps": 16200, "total_steps": 40000, "loss": 0.0626, "lr": 0.19411730881997605, "epoch": 0.7915373903696284, "percentage": 40.5, "elapsed_time": "17:00:15", "remaining_time": "1 day, 0:58:53", "throughput": 335.26, "total_tokens": 20523232} {"current_steps": 16200, "total_steps": 40000, "eval_loss": 0.06604218482971191, "epoch": 0.7915373903696284, "percentage": 40.5, "elapsed_time": "17:10:55", "remaining_time": "1 day, 1:14:33", "throughput": 331.79, "total_tokens": 20523232} {"current_steps": 16205, "total_steps": 40000, "loss": 0.0742, "lr": 0.1940610059243356, "epoch": 0.7917816920333227, "percentage": 40.51, "elapsed_time": "17:10:59", "remaining_time": "1 day, 1:13:52", "throughput": 331.87, "total_tokens": 20529344} {"current_steps": 16210, "total_steps": 40000, "loss": 0.0686, "lr": 0.19400469623393435, "epoch": 0.7920259936970171, "percentage": 40.52, "elapsed_time": "17:11:02", "remaining_time": "1 day, 1:13:10", "throughput": 331.96, "total_tokens": 20536192} {"current_steps": 16215, "total_steps": 40000, "loss": 0.041, "lr": 0.1939483797574559, "epoch": 0.7922702953607114, "percentage": 40.54, "elapsed_time": "17:11:05", "remaining_time": "1 day, 1:12:27", "throughput": 332.05, "total_tokens": 20542240} {"current_steps": 16220, "total_steps": 40000, "loss": 0.0299, "lr": 0.19389205650358504, "epoch": 0.7925145970244057, "percentage": 40.55, "elapsed_time": "17:11:08", "remaining_time": "1 day, 1:11:45", "throughput": 332.14, "total_tokens": 20548960} {"current_steps": 16225, "total_steps": 40000, "loss": 0.0662, "lr": 0.19383572648100747, "epoch": 0.7927588986881, "percentage": 40.56, "elapsed_time": "17:11:11", "remaining_time": "1 day, 1:11:02", "throughput": 332.22, "total_tokens": 20555168} {"current_steps": 16230, "total_steps": 40000, "loss": 0.0342, "lr": 0.19377938969841, "epoch": 0.7930032003517944, "percentage": 40.58, "elapsed_time": "17:11:14", "remaining_time": "1 day, 1:10:20", "throughput": 332.31, "total_tokens": 20561568} {"current_steps": 16235, "total_steps": 40000, "loss": 0.1032, "lr": 0.1937230461644805, "epoch": 0.7932475020154888, "percentage": 40.59, "elapsed_time": "17:11:17", "remaining_time": "1 day, 1:09:37", "throughput": 332.4, "total_tokens": 20568192} {"current_steps": 16240, "total_steps": 40000, "loss": 0.0846, "lr": 0.19366669588790777, "epoch": 0.793491803679183, "percentage": 40.6, "elapsed_time": "17:11:21", "remaining_time": "1 day, 1:08:55", "throughput": 332.49, "total_tokens": 20574816} {"current_steps": 16245, "total_steps": 40000, "loss": 0.0504, "lr": 0.19361033887738185, "epoch": 0.7937361053428774, "percentage": 40.61, "elapsed_time": "17:11:24", "remaining_time": "1 day, 1:08:13", "throughput": 332.58, "total_tokens": 20581280} {"current_steps": 16250, "total_steps": 40000, "loss": 0.0456, "lr": 0.19355397514159361, "epoch": 0.7939804070065717, "percentage": 40.62, "elapsed_time": "17:11:27", "remaining_time": "1 day, 1:07:30", "throughput": 332.66, "total_tokens": 20587744} {"current_steps": 16255, "total_steps": 40000, "loss": 0.039, "lr": 0.19349760468923508, "epoch": 0.7942247086702661, "percentage": 40.64, "elapsed_time": "17:11:30", "remaining_time": "1 day, 1:06:48", "throughput": 332.74, "total_tokens": 20593664} {"current_steps": 16260, "total_steps": 40000, "loss": 0.0462, "lr": 0.19344122752899925, "epoch": 0.7944690103339603, "percentage": 40.65, "elapsed_time": "17:11:33", "remaining_time": "1 day, 1:06:06", "throughput": 332.83, "total_tokens": 20600064} {"current_steps": 16265, "total_steps": 40000, "loss": 0.09, "lr": 0.1933848436695802, "epoch": 0.7947133119976547, "percentage": 40.66, "elapsed_time": "17:11:36", "remaining_time": "1 day, 1:05:23", "throughput": 332.92, "total_tokens": 20606304} {"current_steps": 16270, "total_steps": 40000, "loss": 0.0481, "lr": 0.1933284531196731, "epoch": 0.794957613661349, "percentage": 40.67, "elapsed_time": "17:11:39", "remaining_time": "1 day, 1:04:41", "throughput": 333.0, "total_tokens": 20612416} {"current_steps": 16275, "total_steps": 40000, "loss": 0.0734, "lr": 0.19327205588797403, "epoch": 0.7952019153250434, "percentage": 40.69, "elapsed_time": "17:11:42", "remaining_time": "1 day, 1:03:59", "throughput": 333.08, "total_tokens": 20618848} {"current_steps": 16280, "total_steps": 40000, "loss": 0.0813, "lr": 0.19321565198318014, "epoch": 0.7954462169887377, "percentage": 40.7, "elapsed_time": "17:11:45", "remaining_time": "1 day, 1:03:16", "throughput": 333.17, "total_tokens": 20625280} {"current_steps": 16285, "total_steps": 40000, "loss": 0.039, "lr": 0.1931592414139896, "epoch": 0.795690518652432, "percentage": 40.71, "elapsed_time": "17:11:49", "remaining_time": "1 day, 1:02:34", "throughput": 333.27, "total_tokens": 20632352} {"current_steps": 16290, "total_steps": 40000, "loss": 0.0405, "lr": 0.19310282418910169, "epoch": 0.7959348203161264, "percentage": 40.73, "elapsed_time": "17:11:52", "remaining_time": "1 day, 1:01:52", "throughput": 333.35, "total_tokens": 20638560} {"current_steps": 16295, "total_steps": 40000, "loss": 0.069, "lr": 0.1930464003172166, "epoch": 0.7961791219798207, "percentage": 40.74, "elapsed_time": "17:11:55", "remaining_time": "1 day, 1:01:10", "throughput": 333.43, "total_tokens": 20644384} {"current_steps": 16300, "total_steps": 40000, "loss": 0.0615, "lr": 0.19298996980703567, "epoch": 0.796423423643515, "percentage": 40.75, "elapsed_time": "17:11:58", "remaining_time": "1 day, 1:00:28", "throughput": 333.52, "total_tokens": 20650912} {"current_steps": 16305, "total_steps": 40000, "loss": 0.056, "lr": 0.19293353266726113, "epoch": 0.7966677253072093, "percentage": 40.76, "elapsed_time": "17:12:01", "remaining_time": "1 day, 0:59:46", "throughput": 333.61, "total_tokens": 20657280} {"current_steps": 16310, "total_steps": 40000, "loss": 0.0689, "lr": 0.19287708890659633, "epoch": 0.7969120269709037, "percentage": 40.77, "elapsed_time": "17:12:04", "remaining_time": "1 day, 0:59:04", "throughput": 333.69, "total_tokens": 20663616} {"current_steps": 16315, "total_steps": 40000, "loss": 0.0453, "lr": 0.19282063853374556, "epoch": 0.797156328634598, "percentage": 40.79, "elapsed_time": "17:12:07", "remaining_time": "1 day, 0:58:22", "throughput": 333.78, "total_tokens": 20670208} {"current_steps": 16320, "total_steps": 40000, "loss": 0.0457, "lr": 0.19276418155741423, "epoch": 0.7974006302982923, "percentage": 40.8, "elapsed_time": "17:12:10", "remaining_time": "1 day, 0:57:40", "throughput": 333.87, "total_tokens": 20676608} {"current_steps": 16325, "total_steps": 40000, "loss": 0.0484, "lr": 0.19270771798630867, "epoch": 0.7976449319619867, "percentage": 40.81, "elapsed_time": "17:12:13", "remaining_time": "1 day, 0:56:58", "throughput": 333.96, "total_tokens": 20683104} {"current_steps": 16330, "total_steps": 40000, "loss": 0.049, "lr": 0.1926512478291363, "epoch": 0.797889233625681, "percentage": 40.83, "elapsed_time": "17:12:16", "remaining_time": "1 day, 0:56:16", "throughput": 334.04, "total_tokens": 20689440} {"current_steps": 16335, "total_steps": 40000, "loss": 0.0486, "lr": 0.19259477109460557, "epoch": 0.7981335352893754, "percentage": 40.84, "elapsed_time": "17:12:19", "remaining_time": "1 day, 0:55:34", "throughput": 334.12, "total_tokens": 20695648} {"current_steps": 16340, "total_steps": 40000, "loss": 0.066, "lr": 0.19253828779142584, "epoch": 0.7983778369530696, "percentage": 40.85, "elapsed_time": "17:12:22", "remaining_time": "1 day, 0:54:52", "throughput": 334.21, "total_tokens": 20701824} {"current_steps": 16345, "total_steps": 40000, "loss": 0.057, "lr": 0.19248179792830755, "epoch": 0.798622138616764, "percentage": 40.86, "elapsed_time": "17:12:26", "remaining_time": "1 day, 0:54:10", "throughput": 334.29, "total_tokens": 20708192} {"current_steps": 16350, "total_steps": 40000, "loss": 0.1068, "lr": 0.19242530151396217, "epoch": 0.7988664402804583, "percentage": 40.88, "elapsed_time": "17:12:29", "remaining_time": "1 day, 0:53:28", "throughput": 334.37, "total_tokens": 20713856} {"current_steps": 16355, "total_steps": 40000, "loss": 0.0745, "lr": 0.19236879855710215, "epoch": 0.7991107419441527, "percentage": 40.89, "elapsed_time": "17:12:31", "remaining_time": "1 day, 0:52:46", "throughput": 334.45, "total_tokens": 20719552} {"current_steps": 16360, "total_steps": 40000, "loss": 0.0705, "lr": 0.19231228906644096, "epoch": 0.7993550436078469, "percentage": 40.9, "elapsed_time": "17:12:34", "remaining_time": "1 day, 0:52:04", "throughput": 334.53, "total_tokens": 20725472} {"current_steps": 16365, "total_steps": 40000, "loss": 0.091, "lr": 0.19225577305069302, "epoch": 0.7995993452715413, "percentage": 40.91, "elapsed_time": "17:12:38", "remaining_time": "1 day, 0:51:22", "throughput": 334.62, "total_tokens": 20732160} {"current_steps": 16370, "total_steps": 40000, "loss": 0.0562, "lr": 0.1921992505185739, "epoch": 0.7998436469352356, "percentage": 40.92, "elapsed_time": "17:12:41", "remaining_time": "1 day, 0:50:40", "throughput": 334.7, "total_tokens": 20738592} {"current_steps": 16375, "total_steps": 40000, "loss": 0.0568, "lr": 0.19214272147880004, "epoch": 0.80008794859893, "percentage": 40.94, "elapsed_time": "17:12:44", "remaining_time": "1 day, 0:49:58", "throughput": 334.78, "total_tokens": 20744672} {"current_steps": 16380, "total_steps": 40000, "loss": 0.0412, "lr": 0.19208618594008892, "epoch": 0.8003322502626243, "percentage": 40.95, "elapsed_time": "17:12:47", "remaining_time": "1 day, 0:49:17", "throughput": 334.88, "total_tokens": 20751552} {"current_steps": 16385, "total_steps": 40000, "loss": 0.0996, "lr": 0.19202964391115904, "epoch": 0.8005765519263186, "percentage": 40.96, "elapsed_time": "17:12:50", "remaining_time": "1 day, 0:48:35", "throughput": 334.97, "total_tokens": 20757984} {"current_steps": 16390, "total_steps": 40000, "loss": 0.0833, "lr": 0.1919730954007299, "epoch": 0.800820853590013, "percentage": 40.98, "elapsed_time": "17:12:53", "remaining_time": "1 day, 0:47:53", "throughput": 335.05, "total_tokens": 20764480} {"current_steps": 16395, "total_steps": 40000, "loss": 0.0699, "lr": 0.19191654041752199, "epoch": 0.8010651552537073, "percentage": 40.99, "elapsed_time": "17:12:56", "remaining_time": "1 day, 0:47:12", "throughput": 335.14, "total_tokens": 20770816} {"current_steps": 16400, "total_steps": 40000, "loss": 0.0941, "lr": 0.19185997897025678, "epoch": 0.8013094569174016, "percentage": 41.0, "elapsed_time": "17:13:00", "remaining_time": "1 day, 0:46:30", "throughput": 335.23, "total_tokens": 20777376} {"current_steps": 16400, "total_steps": 40000, "eval_loss": 0.07804276794195175, "epoch": 0.8013094569174016, "percentage": 41.0, "elapsed_time": "17:23:40", "remaining_time": "1 day, 1:01:52", "throughput": 331.8, "total_tokens": 20777376} {"current_steps": 16405, "total_steps": 40000, "loss": 0.0584, "lr": 0.19180341106765672, "epoch": 0.8015537585810959, "percentage": 41.01, "elapsed_time": "17:23:44", "remaining_time": "1 day, 1:01:11", "throughput": 331.89, "total_tokens": 20784096} {"current_steps": 16410, "total_steps": 40000, "loss": 0.0565, "lr": 0.19174683671844536, "epoch": 0.8017980602447903, "percentage": 41.02, "elapsed_time": "17:23:47", "remaining_time": "1 day, 1:00:29", "throughput": 331.97, "total_tokens": 20790560} {"current_steps": 16415, "total_steps": 40000, "loss": 0.0417, "lr": 0.19169025593134717, "epoch": 0.8020423619084845, "percentage": 41.04, "elapsed_time": "17:23:50", "remaining_time": "1 day, 0:59:47", "throughput": 332.06, "total_tokens": 20797120} {"current_steps": 16420, "total_steps": 40000, "loss": 0.0658, "lr": 0.19163366871508764, "epoch": 0.8022866635721789, "percentage": 41.05, "elapsed_time": "17:23:53", "remaining_time": "1 day, 0:59:05", "throughput": 332.15, "total_tokens": 20803648} {"current_steps": 16425, "total_steps": 40000, "loss": 0.071, "lr": 0.19157707507839317, "epoch": 0.8025309652358733, "percentage": 41.06, "elapsed_time": "17:23:56", "remaining_time": "1 day, 0:58:23", "throughput": 332.23, "total_tokens": 20809984} {"current_steps": 16430, "total_steps": 40000, "loss": 0.034, "lr": 0.19152047502999123, "epoch": 0.8027752668995676, "percentage": 41.08, "elapsed_time": "17:23:59", "remaining_time": "1 day, 0:57:41", "throughput": 332.32, "total_tokens": 20816224} {"current_steps": 16435, "total_steps": 40000, "loss": 0.0364, "lr": 0.19146386857861025, "epoch": 0.803019568563262, "percentage": 41.09, "elapsed_time": "17:24:02", "remaining_time": "1 day, 0:56:59", "throughput": 332.41, "total_tokens": 20822848} {"current_steps": 16440, "total_steps": 40000, "loss": 0.0954, "lr": 0.19140725573297968, "epoch": 0.8032638702269562, "percentage": 41.1, "elapsed_time": "17:24:05", "remaining_time": "1 day, 0:56:17", "throughput": 332.49, "total_tokens": 20828960} {"current_steps": 16445, "total_steps": 40000, "loss": 0.079, "lr": 0.19135063650182987, "epoch": 0.8035081718906506, "percentage": 41.11, "elapsed_time": "17:24:08", "remaining_time": "1 day, 0:55:35", "throughput": 332.57, "total_tokens": 20835104} {"current_steps": 16450, "total_steps": 40000, "loss": 0.0754, "lr": 0.19129401089389234, "epoch": 0.8037524735543449, "percentage": 41.12, "elapsed_time": "17:24:12", "remaining_time": "1 day, 0:54:53", "throughput": 332.66, "total_tokens": 20841696} {"current_steps": 16455, "total_steps": 40000, "loss": 0.0681, "lr": 0.19123737891789938, "epoch": 0.8039967752180393, "percentage": 41.14, "elapsed_time": "17:24:15", "remaining_time": "1 day, 0:54:11", "throughput": 332.74, "total_tokens": 20848032} {"current_steps": 16460, "total_steps": 40000, "loss": 0.0846, "lr": 0.19118074058258439, "epoch": 0.8042410768817335, "percentage": 41.15, "elapsed_time": "17:24:18", "remaining_time": "1 day, 0:53:29", "throughput": 332.83, "total_tokens": 20854400} {"current_steps": 16465, "total_steps": 40000, "loss": 0.0768, "lr": 0.1911240958966816, "epoch": 0.8044853785454279, "percentage": 41.16, "elapsed_time": "17:24:21", "remaining_time": "1 day, 0:52:47", "throughput": 332.91, "total_tokens": 20860512} {"current_steps": 16470, "total_steps": 40000, "loss": 0.0811, "lr": 0.19106744486892652, "epoch": 0.8047296802091223, "percentage": 41.17, "elapsed_time": "17:24:24", "remaining_time": "1 day, 0:52:06", "throughput": 333.0, "total_tokens": 20867200} {"current_steps": 16475, "total_steps": 40000, "loss": 0.0709, "lr": 0.1910107875080553, "epoch": 0.8049739818728165, "percentage": 41.19, "elapsed_time": "17:24:27", "remaining_time": "1 day, 0:51:24", "throughput": 333.08, "total_tokens": 20873056} {"current_steps": 16480, "total_steps": 40000, "loss": 0.046, "lr": 0.19095412382280533, "epoch": 0.8052182835365109, "percentage": 41.2, "elapsed_time": "17:24:30", "remaining_time": "1 day, 0:50:42", "throughput": 333.16, "total_tokens": 20879584} {"current_steps": 16485, "total_steps": 40000, "loss": 0.0787, "lr": 0.19089745382191473, "epoch": 0.8054625852002052, "percentage": 41.21, "elapsed_time": "17:24:33", "remaining_time": "1 day, 0:50:00", "throughput": 333.25, "total_tokens": 20886176} {"current_steps": 16490, "total_steps": 40000, "loss": 0.0602, "lr": 0.19084077751412284, "epoch": 0.8057068868638996, "percentage": 41.23, "elapsed_time": "17:24:36", "remaining_time": "1 day, 0:49:19", "throughput": 333.34, "total_tokens": 20892416} {"current_steps": 16495, "total_steps": 40000, "loss": 0.0801, "lr": 0.19078409490816986, "epoch": 0.8059511885275938, "percentage": 41.24, "elapsed_time": "17:24:39", "remaining_time": "1 day, 0:48:37", "throughput": 333.42, "total_tokens": 20898688} {"current_steps": 16500, "total_steps": 40000, "loss": 0.0859, "lr": 0.19072740601279686, "epoch": 0.8061954901912882, "percentage": 41.25, "elapsed_time": "17:24:42", "remaining_time": "1 day, 0:47:55", "throughput": 333.5, "total_tokens": 20904768} {"current_steps": 16505, "total_steps": 40000, "loss": 0.0625, "lr": 0.19067071083674605, "epoch": 0.8064397918549825, "percentage": 41.26, "elapsed_time": "17:24:45", "remaining_time": "1 day, 0:47:13", "throughput": 333.58, "total_tokens": 20910912} {"current_steps": 16510, "total_steps": 40000, "loss": 0.0557, "lr": 0.19061400938876052, "epoch": 0.8066840935186769, "percentage": 41.27, "elapsed_time": "17:24:48", "remaining_time": "1 day, 0:46:32", "throughput": 333.66, "total_tokens": 20917120} {"current_steps": 16515, "total_steps": 40000, "loss": 0.0505, "lr": 0.1905573016775844, "epoch": 0.8069283951823711, "percentage": 41.29, "elapsed_time": "17:24:52", "remaining_time": "1 day, 0:45:50", "throughput": 333.74, "total_tokens": 20923104} {"current_steps": 16520, "total_steps": 40000, "loss": 0.0582, "lr": 0.19050058771196263, "epoch": 0.8071726968460655, "percentage": 41.3, "elapsed_time": "17:24:55", "remaining_time": "1 day, 0:45:08", "throughput": 333.83, "total_tokens": 20929440} {"current_steps": 16525, "total_steps": 40000, "loss": 0.0522, "lr": 0.19044386750064132, "epoch": 0.8074169985097599, "percentage": 41.31, "elapsed_time": "17:24:58", "remaining_time": "1 day, 0:44:27", "throughput": 333.92, "total_tokens": 20935936} {"current_steps": 16530, "total_steps": 40000, "loss": 0.0686, "lr": 0.19038714105236737, "epoch": 0.8076613001734542, "percentage": 41.33, "elapsed_time": "17:25:01", "remaining_time": "1 day, 0:43:46", "throughput": 334.0, "total_tokens": 20942432} {"current_steps": 16535, "total_steps": 40000, "loss": 0.0948, "lr": 0.19033040837588874, "epoch": 0.8079056018371485, "percentage": 41.34, "elapsed_time": "17:25:04", "remaining_time": "1 day, 0:43:04", "throughput": 334.1, "total_tokens": 20949536} {"current_steps": 16540, "total_steps": 40000, "loss": 0.0726, "lr": 0.1902736694799543, "epoch": 0.8081499035008428, "percentage": 41.35, "elapsed_time": "17:25:07", "remaining_time": "1 day, 0:42:23", "throughput": 334.18, "total_tokens": 20955776} {"current_steps": 16545, "total_steps": 40000, "loss": 0.0543, "lr": 0.19021692437331392, "epoch": 0.8083942051645372, "percentage": 41.36, "elapsed_time": "17:25:10", "remaining_time": "1 day, 0:41:41", "throughput": 334.27, "total_tokens": 20962176} {"current_steps": 16550, "total_steps": 40000, "loss": 0.0507, "lr": 0.1901601730647184, "epoch": 0.8086385068282315, "percentage": 41.38, "elapsed_time": "17:25:13", "remaining_time": "1 day, 0:41:00", "throughput": 334.34, "total_tokens": 20968000} {"current_steps": 16555, "total_steps": 40000, "loss": 0.0676, "lr": 0.19010341556291954, "epoch": 0.8088828084919258, "percentage": 41.39, "elapsed_time": "17:25:16", "remaining_time": "1 day, 0:40:18", "throughput": 334.43, "total_tokens": 20974688} {"current_steps": 16560, "total_steps": 40000, "loss": 0.0864, "lr": 0.19004665187667, "epoch": 0.8091271101556201, "percentage": 41.4, "elapsed_time": "17:25:20", "remaining_time": "1 day, 0:39:37", "throughput": 334.53, "total_tokens": 20981696} {"current_steps": 16565, "total_steps": 40000, "loss": 0.0892, "lr": 0.1899898820147235, "epoch": 0.8093714118193145, "percentage": 41.41, "elapsed_time": "17:25:23", "remaining_time": "1 day, 0:38:56", "throughput": 334.61, "total_tokens": 20987712} {"current_steps": 16570, "total_steps": 40000, "loss": 0.0552, "lr": 0.18993310598583465, "epoch": 0.8096157134830089, "percentage": 41.42, "elapsed_time": "17:25:26", "remaining_time": "1 day, 0:38:15", "throughput": 334.69, "total_tokens": 20994080} {"current_steps": 16575, "total_steps": 40000, "loss": 0.0999, "lr": 0.18987632379875904, "epoch": 0.8098600151467031, "percentage": 41.44, "elapsed_time": "17:25:29", "remaining_time": "1 day, 0:37:33", "throughput": 334.78, "total_tokens": 21000352} {"current_steps": 16580, "total_steps": 40000, "loss": 0.0785, "lr": 0.18981953546225314, "epoch": 0.8101043168103975, "percentage": 41.45, "elapsed_time": "17:25:32", "remaining_time": "1 day, 0:36:52", "throughput": 334.87, "total_tokens": 21006976} {"current_steps": 16585, "total_steps": 40000, "loss": 0.0749, "lr": 0.18976274098507445, "epoch": 0.8103486184740918, "percentage": 41.46, "elapsed_time": "17:25:35", "remaining_time": "1 day, 0:36:11", "throughput": 334.95, "total_tokens": 21013280} {"current_steps": 16590, "total_steps": 40000, "loss": 0.0473, "lr": 0.18970594037598146, "epoch": 0.8105929201377862, "percentage": 41.48, "elapsed_time": "17:25:38", "remaining_time": "1 day, 0:35:29", "throughput": 335.04, "total_tokens": 21019680} {"current_steps": 16595, "total_steps": 40000, "loss": 0.0692, "lr": 0.1896491336437335, "epoch": 0.8108372218014804, "percentage": 41.49, "elapsed_time": "17:25:41", "remaining_time": "1 day, 0:34:48", "throughput": 335.11, "total_tokens": 21025600} {"current_steps": 16600, "total_steps": 40000, "loss": 0.0905, "lr": 0.18959232079709085, "epoch": 0.8110815234651748, "percentage": 41.5, "elapsed_time": "17:25:44", "remaining_time": "1 day, 0:34:07", "throughput": 335.2, "total_tokens": 21031776} {"current_steps": 16600, "total_steps": 40000, "eval_loss": 0.06692992150783539, "epoch": 0.8110815234651748, "percentage": 41.5, "elapsed_time": "17:36:25", "remaining_time": "1 day, 0:49:10", "throughput": 331.81, "total_tokens": 21031776} {"current_steps": 16605, "total_steps": 40000, "loss": 0.0695, "lr": 0.18953550184481477, "epoch": 0.8113258251288691, "percentage": 41.51, "elapsed_time": "17:36:28", "remaining_time": "1 day, 0:48:29", "throughput": 331.89, "total_tokens": 21038048} {"current_steps": 16610, "total_steps": 40000, "loss": 0.0722, "lr": 0.18947867679566752, "epoch": 0.8115701267925635, "percentage": 41.52, "elapsed_time": "17:36:31", "remaining_time": "1 day, 0:47:47", "throughput": 331.97, "total_tokens": 21044352} {"current_steps": 16615, "total_steps": 40000, "loss": 0.0703, "lr": 0.18942184565841216, "epoch": 0.8118144284562578, "percentage": 41.54, "elapsed_time": "17:36:34", "remaining_time": "1 day, 0:47:06", "throughput": 332.06, "total_tokens": 21050752} {"current_steps": 16620, "total_steps": 40000, "loss": 0.0542, "lr": 0.18936500844181278, "epoch": 0.8120587301199521, "percentage": 41.55, "elapsed_time": "17:36:38", "remaining_time": "1 day, 0:46:24", "throughput": 332.14, "total_tokens": 21057184} {"current_steps": 16625, "total_steps": 40000, "loss": 0.0643, "lr": 0.18930816515463436, "epoch": 0.8123030317836465, "percentage": 41.56, "elapsed_time": "17:36:41", "remaining_time": "1 day, 0:45:43", "throughput": 332.23, "total_tokens": 21063680} {"current_steps": 16630, "total_steps": 40000, "loss": 0.0589, "lr": 0.18925131580564297, "epoch": 0.8125473334473408, "percentage": 41.58, "elapsed_time": "17:36:44", "remaining_time": "1 day, 0:45:01", "throughput": 332.32, "total_tokens": 21070400} {"current_steps": 16635, "total_steps": 40000, "loss": 0.0632, "lr": 0.1891944604036054, "epoch": 0.8127916351110351, "percentage": 41.59, "elapsed_time": "17:36:47", "remaining_time": "1 day, 0:44:20", "throughput": 332.4, "total_tokens": 21076320} {"current_steps": 16640, "total_steps": 40000, "loss": 0.0673, "lr": 0.1891375989572895, "epoch": 0.8130359367747294, "percentage": 41.6, "elapsed_time": "17:36:50", "remaining_time": "1 day, 0:43:38", "throughput": 332.48, "total_tokens": 21082848} {"current_steps": 16645, "total_steps": 40000, "loss": 0.0526, "lr": 0.18908073147546398, "epoch": 0.8132802384384238, "percentage": 41.61, "elapsed_time": "17:36:53", "remaining_time": "1 day, 0:42:57", "throughput": 332.57, "total_tokens": 21089312} {"current_steps": 16650, "total_steps": 40000, "loss": 0.0467, "lr": 0.18902385796689858, "epoch": 0.813524540102118, "percentage": 41.62, "elapsed_time": "17:36:56", "remaining_time": "1 day, 0:42:15", "throughput": 332.65, "total_tokens": 21095456} {"current_steps": 16655, "total_steps": 40000, "loss": 0.0521, "lr": 0.18896697844036384, "epoch": 0.8137688417658124, "percentage": 41.64, "elapsed_time": "17:36:59", "remaining_time": "1 day, 0:41:34", "throughput": 332.74, "total_tokens": 21102080} {"current_steps": 16660, "total_steps": 40000, "loss": 0.0405, "lr": 0.18891009290463137, "epoch": 0.8140131434295067, "percentage": 41.65, "elapsed_time": "17:37:02", "remaining_time": "1 day, 0:40:53", "throughput": 332.82, "total_tokens": 21108256} {"current_steps": 16665, "total_steps": 40000, "loss": 0.1127, "lr": 0.18885320136847353, "epoch": 0.8142574450932011, "percentage": 41.66, "elapsed_time": "17:37:05", "remaining_time": "1 day, 0:40:11", "throughput": 332.9, "total_tokens": 21114272} {"current_steps": 16670, "total_steps": 40000, "loss": 0.0477, "lr": 0.1887963038406639, "epoch": 0.8145017467568955, "percentage": 41.68, "elapsed_time": "17:37:09", "remaining_time": "1 day, 0:39:30", "throughput": 332.98, "total_tokens": 21120416} {"current_steps": 16675, "total_steps": 40000, "loss": 0.0659, "lr": 0.18873940032997658, "epoch": 0.8147460484205897, "percentage": 41.69, "elapsed_time": "17:37:12", "remaining_time": "1 day, 0:38:48", "throughput": 333.06, "total_tokens": 21126432} {"current_steps": 16680, "total_steps": 40000, "loss": 0.0513, "lr": 0.18868249084518693, "epoch": 0.8149903500842841, "percentage": 41.7, "elapsed_time": "17:37:15", "remaining_time": "1 day, 0:38:07", "throughput": 333.14, "total_tokens": 21132864} {"current_steps": 16685, "total_steps": 40000, "loss": 0.0581, "lr": 0.18862557539507102, "epoch": 0.8152346517479784, "percentage": 41.71, "elapsed_time": "17:37:18", "remaining_time": "1 day, 0:37:26", "throughput": 333.23, "total_tokens": 21139200} {"current_steps": 16690, "total_steps": 40000, "loss": 0.0817, "lr": 0.18856865398840605, "epoch": 0.8154789534116728, "percentage": 41.73, "elapsed_time": "17:37:21", "remaining_time": "1 day, 0:36:44", "throughput": 333.3, "total_tokens": 21145120} {"current_steps": 16695, "total_steps": 40000, "loss": 0.0607, "lr": 0.18851172663396995, "epoch": 0.815723255075367, "percentage": 41.74, "elapsed_time": "17:37:24", "remaining_time": "1 day, 0:36:03", "throughput": 333.39, "total_tokens": 21151424} {"current_steps": 16700, "total_steps": 40000, "loss": 0.0533, "lr": 0.1884547933405416, "epoch": 0.8159675567390614, "percentage": 41.75, "elapsed_time": "17:37:27", "remaining_time": "1 day, 0:35:22", "throughput": 333.47, "total_tokens": 21157728} {"current_steps": 16705, "total_steps": 40000, "loss": 0.032, "lr": 0.1883978541169009, "epoch": 0.8162118584027557, "percentage": 41.76, "elapsed_time": "17:37:30", "remaining_time": "1 day, 0:34:41", "throughput": 333.55, "total_tokens": 21164192} {"current_steps": 16710, "total_steps": 40000, "loss": 0.0505, "lr": 0.18834090897182854, "epoch": 0.81645616006645, "percentage": 41.77, "elapsed_time": "17:37:33", "remaining_time": "1 day, 0:34:00", "throughput": 333.64, "total_tokens": 21170464} {"current_steps": 16715, "total_steps": 40000, "loss": 0.0952, "lr": 0.1882839579141062, "epoch": 0.8167004617301444, "percentage": 41.79, "elapsed_time": "17:37:36", "remaining_time": "1 day, 0:33:18", "throughput": 333.72, "total_tokens": 21176544} {"current_steps": 16720, "total_steps": 40000, "loss": 0.082, "lr": 0.18822700095251646, "epoch": 0.8169447633938387, "percentage": 41.8, "elapsed_time": "17:37:39", "remaining_time": "1 day, 0:32:37", "throughput": 333.8, "total_tokens": 21182656} {"current_steps": 16725, "total_steps": 40000, "loss": 0.073, "lr": 0.18817003809584273, "epoch": 0.8171890650575331, "percentage": 41.81, "elapsed_time": "17:37:42", "remaining_time": "1 day, 0:31:56", "throughput": 333.89, "total_tokens": 21189472} {"current_steps": 16730, "total_steps": 40000, "loss": 0.0767, "lr": 0.1881130693528695, "epoch": 0.8174333667212274, "percentage": 41.83, "elapsed_time": "17:37:45", "remaining_time": "1 day, 0:31:15", "throughput": 333.97, "total_tokens": 21195616} {"current_steps": 16735, "total_steps": 40000, "loss": 0.0663, "lr": 0.18805609473238197, "epoch": 0.8176776683849217, "percentage": 41.84, "elapsed_time": "17:37:49", "remaining_time": "1 day, 0:30:34", "throughput": 334.06, "total_tokens": 21202176} {"current_steps": 16740, "total_steps": 40000, "loss": 0.0855, "lr": 0.18799911424316643, "epoch": 0.817921970048616, "percentage": 41.85, "elapsed_time": "17:37:52", "remaining_time": "1 day, 0:29:53", "throughput": 334.14, "total_tokens": 21208640} {"current_steps": 16745, "total_steps": 40000, "loss": 0.068, "lr": 0.18794212789400994, "epoch": 0.8181662717123104, "percentage": 41.86, "elapsed_time": "17:37:55", "remaining_time": "1 day, 0:29:12", "throughput": 334.23, "total_tokens": 21215328} {"current_steps": 16750, "total_steps": 40000, "loss": 0.0594, "lr": 0.18788513569370052, "epoch": 0.8184105733760046, "percentage": 41.88, "elapsed_time": "17:37:58", "remaining_time": "1 day, 0:28:31", "throughput": 334.31, "total_tokens": 21221664} {"current_steps": 16755, "total_steps": 40000, "loss": 0.081, "lr": 0.1878281376510271, "epoch": 0.818654875039699, "percentage": 41.89, "elapsed_time": "17:38:01", "remaining_time": "1 day, 0:27:50", "throughput": 334.4, "total_tokens": 21227936} {"current_steps": 16760, "total_steps": 40000, "loss": 0.0489, "lr": 0.18777113377477941, "epoch": 0.8188991767033934, "percentage": 41.9, "elapsed_time": "17:38:04", "remaining_time": "1 day, 0:27:09", "throughput": 334.48, "total_tokens": 21234048} {"current_steps": 16765, "total_steps": 40000, "loss": 0.0444, "lr": 0.1877141240737483, "epoch": 0.8191434783670877, "percentage": 41.91, "elapsed_time": "17:38:07", "remaining_time": "1 day, 0:26:28", "throughput": 334.56, "total_tokens": 21240320} {"current_steps": 16770, "total_steps": 40000, "loss": 0.0637, "lr": 0.18765710855672527, "epoch": 0.819387780030782, "percentage": 41.93, "elapsed_time": "17:38:10", "remaining_time": "1 day, 0:25:48", "throughput": 334.65, "total_tokens": 21247104} {"current_steps": 16775, "total_steps": 40000, "loss": 0.0459, "lr": 0.18760008723250288, "epoch": 0.8196320816944763, "percentage": 41.94, "elapsed_time": "17:38:13", "remaining_time": "1 day, 0:25:07", "throughput": 334.73, "total_tokens": 21253248} {"current_steps": 16780, "total_steps": 40000, "loss": 0.0598, "lr": 0.18754306010987457, "epoch": 0.8198763833581707, "percentage": 41.95, "elapsed_time": "17:38:16", "remaining_time": "1 day, 0:24:26", "throughput": 334.81, "total_tokens": 21259200} {"current_steps": 16785, "total_steps": 40000, "loss": 0.0769, "lr": 0.18748602719763457, "epoch": 0.820120685021865, "percentage": 41.96, "elapsed_time": "17:38:19", "remaining_time": "1 day, 0:23:45", "throughput": 334.88, "total_tokens": 21265088} {"current_steps": 16790, "total_steps": 40000, "loss": 0.0589, "lr": 0.18742898850457804, "epoch": 0.8203649866855593, "percentage": 41.98, "elapsed_time": "17:38:23", "remaining_time": "1 day, 0:23:04", "throughput": 334.97, "total_tokens": 21271296} {"current_steps": 16795, "total_steps": 40000, "loss": 0.0446, "lr": 0.1873719440395012, "epoch": 0.8206092883492536, "percentage": 41.99, "elapsed_time": "17:38:26", "remaining_time": "1 day, 0:22:23", "throughput": 335.05, "total_tokens": 21277760} {"current_steps": 16800, "total_steps": 40000, "loss": 0.0633, "lr": 0.1873148938112009, "epoch": 0.820853590012948, "percentage": 42.0, "elapsed_time": "17:38:29", "remaining_time": "1 day, 0:21:42", "throughput": 335.12, "total_tokens": 21283328} {"current_steps": 16800, "total_steps": 40000, "eval_loss": 0.06929633021354675, "epoch": 0.820853590012948, "percentage": 42.0, "elapsed_time": "17:49:09", "remaining_time": "1 day, 0:36:27", "throughput": 331.78, "total_tokens": 21283328} {"current_steps": 16805, "total_steps": 40000, "loss": 0.0837, "lr": 0.18725783782847508, "epoch": 0.8210978916766423, "percentage": 42.01, "elapsed_time": "17:49:13", "remaining_time": "1 day, 0:35:47", "throughput": 331.86, "total_tokens": 21289824} {"current_steps": 16810, "total_steps": 40000, "loss": 0.0566, "lr": 0.1872007761001224, "epoch": 0.8213421933403366, "percentage": 42.02, "elapsed_time": "17:49:16", "remaining_time": "1 day, 0:35:06", "throughput": 331.95, "total_tokens": 21296544} {"current_steps": 16815, "total_steps": 40000, "loss": 0.0753, "lr": 0.1871437086349426, "epoch": 0.821586495004031, "percentage": 42.04, "elapsed_time": "17:49:19", "remaining_time": "1 day, 0:34:24", "throughput": 332.03, "total_tokens": 21302656} {"current_steps": 16820, "total_steps": 40000, "loss": 0.0763, "lr": 0.18708663544173615, "epoch": 0.8218307966677253, "percentage": 42.05, "elapsed_time": "17:49:22", "remaining_time": "1 day, 0:33:43", "throughput": 332.11, "total_tokens": 21309120} {"current_steps": 16825, "total_steps": 40000, "loss": 0.0873, "lr": 0.18702955652930442, "epoch": 0.8220750983314197, "percentage": 42.06, "elapsed_time": "17:49:25", "remaining_time": "1 day, 0:33:02", "throughput": 332.19, "total_tokens": 21315392} {"current_steps": 16830, "total_steps": 40000, "loss": 0.0437, "lr": 0.18697247190644972, "epoch": 0.8223193999951139, "percentage": 42.08, "elapsed_time": "17:49:28", "remaining_time": "1 day, 0:32:21", "throughput": 332.27, "total_tokens": 21321536} {"current_steps": 16835, "total_steps": 40000, "loss": 0.0761, "lr": 0.18691538158197527, "epoch": 0.8225637016588083, "percentage": 42.09, "elapsed_time": "17:49:31", "remaining_time": "1 day, 0:31:40", "throughput": 332.36, "total_tokens": 21328000} {"current_steps": 16840, "total_steps": 40000, "loss": 0.0761, "lr": 0.1868582855646851, "epoch": 0.8228080033225026, "percentage": 42.1, "elapsed_time": "17:49:34", "remaining_time": "1 day, 0:30:59", "throughput": 332.44, "total_tokens": 21334048} {"current_steps": 16845, "total_steps": 40000, "loss": 0.0495, "lr": 0.18680118386338404, "epoch": 0.823052304986197, "percentage": 42.11, "elapsed_time": "17:49:37", "remaining_time": "1 day, 0:30:18", "throughput": 332.52, "total_tokens": 21340512} {"current_steps": 16850, "total_steps": 40000, "loss": 0.052, "lr": 0.18674407648687794, "epoch": 0.8232966066498912, "percentage": 42.12, "elapsed_time": "17:49:40", "remaining_time": "1 day, 0:29:37", "throughput": 332.6, "total_tokens": 21346560} {"current_steps": 16855, "total_steps": 40000, "loss": 0.0557, "lr": 0.1866869634439736, "epoch": 0.8235409083135856, "percentage": 42.14, "elapsed_time": "17:49:44", "remaining_time": "1 day, 0:28:56", "throughput": 332.68, "total_tokens": 21352640} {"current_steps": 16860, "total_steps": 40000, "loss": 0.0436, "lr": 0.18662984474347838, "epoch": 0.82378520997728, "percentage": 42.15, "elapsed_time": "17:49:47", "remaining_time": "1 day, 0:28:15", "throughput": 332.76, "total_tokens": 21358976} {"current_steps": 16865, "total_steps": 40000, "loss": 0.0515, "lr": 0.1865727203942008, "epoch": 0.8240295116409743, "percentage": 42.16, "elapsed_time": "17:49:50", "remaining_time": "1 day, 0:27:34", "throughput": 332.84, "total_tokens": 21365152} {"current_steps": 16870, "total_steps": 40000, "loss": 0.0623, "lr": 0.1865155904049501, "epoch": 0.8242738133046686, "percentage": 42.18, "elapsed_time": "17:49:53", "remaining_time": "1 day, 0:26:53", "throughput": 332.92, "total_tokens": 21371040} {"current_steps": 16875, "total_steps": 40000, "loss": 0.0589, "lr": 0.1864584547845365, "epoch": 0.8245181149683629, "percentage": 42.19, "elapsed_time": "17:49:56", "remaining_time": "1 day, 0:26:12", "throughput": 333.0, "total_tokens": 21377248} {"current_steps": 16880, "total_steps": 40000, "loss": 0.0752, "lr": 0.186401313541771, "epoch": 0.8247624166320573, "percentage": 42.2, "elapsed_time": "17:49:59", "remaining_time": "1 day, 0:25:31", "throughput": 333.09, "total_tokens": 21383936} {"current_steps": 16885, "total_steps": 40000, "loss": 0.0675, "lr": 0.18634416668546552, "epoch": 0.8250067182957516, "percentage": 42.21, "elapsed_time": "17:50:02", "remaining_time": "1 day, 0:24:51", "throughput": 333.17, "total_tokens": 21390400} {"current_steps": 16890, "total_steps": 40000, "loss": 0.0417, "lr": 0.1862870142244328, "epoch": 0.8252510199594459, "percentage": 42.23, "elapsed_time": "17:50:05", "remaining_time": "1 day, 0:24:10", "throughput": 333.25, "total_tokens": 21396800} {"current_steps": 16895, "total_steps": 40000, "loss": 0.1002, "lr": 0.1862298561674865, "epoch": 0.8254953216231402, "percentage": 42.24, "elapsed_time": "17:50:08", "remaining_time": "1 day, 0:23:29", "throughput": 333.33, "total_tokens": 21402944} {"current_steps": 16900, "total_steps": 40000, "loss": 0.0963, "lr": 0.18617269252344104, "epoch": 0.8257396232868346, "percentage": 42.25, "elapsed_time": "17:50:11", "remaining_time": "1 day, 0:22:48", "throughput": 333.42, "total_tokens": 21409184} {"current_steps": 16905, "total_steps": 40000, "loss": 0.0588, "lr": 0.18611552330111186, "epoch": 0.8259839249505289, "percentage": 42.26, "elapsed_time": "17:50:14", "remaining_time": "1 day, 0:22:07", "throughput": 333.5, "total_tokens": 21415392} {"current_steps": 16910, "total_steps": 40000, "loss": 0.0534, "lr": 0.18605834850931507, "epoch": 0.8262282266142232, "percentage": 42.27, "elapsed_time": "17:50:17", "remaining_time": "1 day, 0:21:27", "throughput": 333.58, "total_tokens": 21421824} {"current_steps": 16915, "total_steps": 40000, "loss": 0.0422, "lr": 0.18600116815686787, "epoch": 0.8264725282779176, "percentage": 42.29, "elapsed_time": "17:50:21", "remaining_time": "1 day, 0:20:46", "throughput": 333.67, "total_tokens": 21428384} {"current_steps": 16920, "total_steps": 40000, "loss": 0.0647, "lr": 0.1859439822525881, "epoch": 0.8267168299416119, "percentage": 42.3, "elapsed_time": "17:50:24", "remaining_time": "1 day, 0:20:05", "throughput": 333.75, "total_tokens": 21434496} {"current_steps": 16925, "total_steps": 40000, "loss": 0.0704, "lr": 0.18588679080529455, "epoch": 0.8269611316053063, "percentage": 42.31, "elapsed_time": "17:50:27", "remaining_time": "1 day, 0:19:25", "throughput": 333.83, "total_tokens": 21440864} {"current_steps": 16930, "total_steps": 40000, "loss": 0.0721, "lr": 0.1858295938238069, "epoch": 0.8272054332690005, "percentage": 42.33, "elapsed_time": "17:50:30", "remaining_time": "1 day, 0:18:44", "throughput": 333.92, "total_tokens": 21447776} {"current_steps": 16935, "total_steps": 40000, "loss": 0.0869, "lr": 0.18577239131694562, "epoch": 0.8274497349326949, "percentage": 42.34, "elapsed_time": "17:50:33", "remaining_time": "1 day, 0:18:04", "throughput": 334.0, "total_tokens": 21454208} {"current_steps": 16940, "total_steps": 40000, "loss": 0.0866, "lr": 0.18571518329353204, "epoch": 0.8276940365963892, "percentage": 42.35, "elapsed_time": "17:50:36", "remaining_time": "1 day, 0:17:23", "throughput": 334.08, "total_tokens": 21460128} {"current_steps": 16945, "total_steps": 40000, "loss": 0.0709, "lr": 0.18565796976238838, "epoch": 0.8279383382600836, "percentage": 42.36, "elapsed_time": "17:50:39", "remaining_time": "1 day, 0:16:42", "throughput": 334.16, "total_tokens": 21466144} {"current_steps": 16950, "total_steps": 40000, "loss": 0.0693, "lr": 0.18560075073233764, "epoch": 0.8281826399237778, "percentage": 42.38, "elapsed_time": "17:50:42", "remaining_time": "1 day, 0:16:02", "throughput": 334.24, "total_tokens": 21472544} {"current_steps": 16955, "total_steps": 40000, "loss": 0.0418, "lr": 0.18554352621220377, "epoch": 0.8284269415874722, "percentage": 42.39, "elapsed_time": "17:50:45", "remaining_time": "1 day, 0:15:21", "throughput": 334.33, "total_tokens": 21479456} {"current_steps": 16960, "total_steps": 40000, "loss": 0.0496, "lr": 0.18548629621081153, "epoch": 0.8286712432511666, "percentage": 42.4, "elapsed_time": "17:50:48", "remaining_time": "1 day, 0:14:41", "throughput": 334.42, "total_tokens": 21485920} {"current_steps": 16965, "total_steps": 40000, "loss": 0.0678, "lr": 0.18542906073698645, "epoch": 0.8289155449148609, "percentage": 42.41, "elapsed_time": "17:50:51", "remaining_time": "1 day, 0:14:00", "throughput": 334.49, "total_tokens": 21491872} {"current_steps": 16970, "total_steps": 40000, "loss": 0.0903, "lr": 0.18537181979955494, "epoch": 0.8291598465785552, "percentage": 42.43, "elapsed_time": "17:50:54", "remaining_time": "1 day, 0:13:20", "throughput": 334.57, "total_tokens": 21497952} {"current_steps": 16975, "total_steps": 40000, "loss": 0.0697, "lr": 0.18531457340734434, "epoch": 0.8294041482422495, "percentage": 42.44, "elapsed_time": "17:50:57", "remaining_time": "1 day, 0:12:39", "throughput": 334.65, "total_tokens": 21504128} {"current_steps": 16980, "total_steps": 40000, "loss": 0.0265, "lr": 0.1852573215691827, "epoch": 0.8296484499059439, "percentage": 42.45, "elapsed_time": "17:51:00", "remaining_time": "1 day, 0:11:59", "throughput": 334.74, "total_tokens": 21510464} {"current_steps": 16985, "total_steps": 40000, "loss": 0.0734, "lr": 0.18520006429389904, "epoch": 0.8298927515696382, "percentage": 42.46, "elapsed_time": "17:51:04", "remaining_time": "1 day, 0:11:19", "throughput": 334.82, "total_tokens": 21516768} {"current_steps": 16990, "total_steps": 40000, "loss": 0.0746, "lr": 0.1851428015903231, "epoch": 0.8301370532333325, "percentage": 42.48, "elapsed_time": "17:51:07", "remaining_time": "1 day, 0:10:38", "throughput": 334.9, "total_tokens": 21522720} {"current_steps": 16995, "total_steps": 40000, "loss": 0.0735, "lr": 0.1850855334672855, "epoch": 0.8303813548970268, "percentage": 42.49, "elapsed_time": "17:51:10", "remaining_time": "1 day, 0:09:58", "throughput": 334.98, "total_tokens": 21528928} {"current_steps": 17000, "total_steps": 40000, "loss": 0.0453, "lr": 0.1850282599336178, "epoch": 0.8306256565607212, "percentage": 42.5, "elapsed_time": "17:51:13", "remaining_time": "1 day, 0:09:17", "throughput": 335.06, "total_tokens": 21535072} {"current_steps": 17000, "total_steps": 40000, "eval_loss": 0.06798975169658661, "epoch": 0.8306256565607212, "percentage": 42.5, "elapsed_time": "18:01:53", "remaining_time": "1 day, 0:23:44", "throughput": 331.75, "total_tokens": 21535072} {"current_steps": 17005, "total_steps": 40000, "loss": 0.0832, "lr": 0.18497098099815215, "epoch": 0.8308699582244156, "percentage": 42.51, "elapsed_time": "18:01:57", "remaining_time": "1 day, 0:23:04", "throughput": 331.83, "total_tokens": 21541152} {"current_steps": 17010, "total_steps": 40000, "loss": 0.1077, "lr": 0.18491369666972174, "epoch": 0.8311142598881098, "percentage": 42.52, "elapsed_time": "18:02:00", "remaining_time": "1 day, 0:22:23", "throughput": 331.91, "total_tokens": 21547552} {"current_steps": 17015, "total_steps": 40000, "loss": 0.0674, "lr": 0.1848564069571606, "epoch": 0.8313585615518042, "percentage": 42.54, "elapsed_time": "18:02:03", "remaining_time": "1 day, 0:21:42", "throughput": 332.0, "total_tokens": 21554272} {"current_steps": 17020, "total_steps": 40000, "loss": 0.052, "lr": 0.18479911186930348, "epoch": 0.8316028632154985, "percentage": 42.55, "elapsed_time": "18:02:06", "remaining_time": "1 day, 0:21:02", "throughput": 332.07, "total_tokens": 21560416} {"current_steps": 17025, "total_steps": 40000, "loss": 0.0461, "lr": 0.18474181141498597, "epoch": 0.8318471648791929, "percentage": 42.56, "elapsed_time": "18:02:09", "remaining_time": "1 day, 0:20:21", "throughput": 332.16, "total_tokens": 21566688} {"current_steps": 17030, "total_steps": 40000, "loss": 0.09, "lr": 0.18468450560304453, "epoch": 0.8320914665428871, "percentage": 42.58, "elapsed_time": "18:02:12", "remaining_time": "1 day, 0:19:40", "throughput": 332.24, "total_tokens": 21572896} {"current_steps": 17035, "total_steps": 40000, "loss": 0.0507, "lr": 0.1846271944423165, "epoch": 0.8323357682065815, "percentage": 42.59, "elapsed_time": "18:02:15", "remaining_time": "1 day, 0:19:00", "throughput": 332.31, "total_tokens": 21579040} {"current_steps": 17040, "total_steps": 40000, "loss": 0.042, "lr": 0.18456987794163993, "epoch": 0.8325800698702758, "percentage": 42.6, "elapsed_time": "18:02:18", "remaining_time": "1 day, 0:18:19", "throughput": 332.4, "total_tokens": 21585376} {"current_steps": 17045, "total_steps": 40000, "loss": 0.0563, "lr": 0.18451255610985373, "epoch": 0.8328243715339702, "percentage": 42.61, "elapsed_time": "18:02:21", "remaining_time": "1 day, 0:17:38", "throughput": 332.47, "total_tokens": 21591168} {"current_steps": 17050, "total_steps": 40000, "loss": 0.0775, "lr": 0.18445522895579766, "epoch": 0.8330686731976644, "percentage": 42.62, "elapsed_time": "18:02:24", "remaining_time": "1 day, 0:16:58", "throughput": 332.55, "total_tokens": 21597312} {"current_steps": 17055, "total_steps": 40000, "loss": 0.0809, "lr": 0.1843978964883123, "epoch": 0.8333129748613588, "percentage": 42.64, "elapsed_time": "18:02:27", "remaining_time": "1 day, 0:16:17", "throughput": 332.63, "total_tokens": 21603584} {"current_steps": 17060, "total_steps": 40000, "loss": 0.0482, "lr": 0.18434055871623906, "epoch": 0.8335572765250532, "percentage": 42.65, "elapsed_time": "18:02:30", "remaining_time": "1 day, 0:15:37", "throughput": 332.71, "total_tokens": 21609600} {"current_steps": 17065, "total_steps": 40000, "loss": 0.0866, "lr": 0.18428321564842007, "epoch": 0.8338015781887474, "percentage": 42.66, "elapsed_time": "18:02:34", "remaining_time": "1 day, 0:14:56", "throughput": 332.8, "total_tokens": 21616608} {"current_steps": 17070, "total_steps": 40000, "loss": 0.079, "lr": 0.18422586729369841, "epoch": 0.8340458798524418, "percentage": 42.68, "elapsed_time": "18:02:37", "remaining_time": "1 day, 0:14:16", "throughput": 332.87, "total_tokens": 21622336} {"current_steps": 17075, "total_steps": 40000, "loss": 0.0754, "lr": 0.1841685136609179, "epoch": 0.8342901815161361, "percentage": 42.69, "elapsed_time": "18:02:40", "remaining_time": "1 day, 0:13:35", "throughput": 332.95, "total_tokens": 21628736} {"current_steps": 17080, "total_steps": 40000, "loss": 0.0643, "lr": 0.18411115475892326, "epoch": 0.8345344831798305, "percentage": 42.7, "elapsed_time": "18:02:43", "remaining_time": "1 day, 0:12:55", "throughput": 333.03, "total_tokens": 21634592} {"current_steps": 17085, "total_steps": 40000, "loss": 0.0457, "lr": 0.18405379059655982, "epoch": 0.8347787848435247, "percentage": 42.71, "elapsed_time": "18:02:46", "remaining_time": "1 day, 0:12:15", "throughput": 333.11, "total_tokens": 21641056} {"current_steps": 17090, "total_steps": 40000, "loss": 0.0588, "lr": 0.1839964211826739, "epoch": 0.8350230865072191, "percentage": 42.73, "elapsed_time": "18:02:49", "remaining_time": "1 day, 0:11:34", "throughput": 333.2, "total_tokens": 21647584} {"current_steps": 17095, "total_steps": 40000, "loss": 0.0583, "lr": 0.18393904652611265, "epoch": 0.8352673881709134, "percentage": 42.74, "elapsed_time": "18:02:52", "remaining_time": "1 day, 0:10:54", "throughput": 333.28, "total_tokens": 21654016} {"current_steps": 17100, "total_steps": 40000, "loss": 0.0867, "lr": 0.18388166663572392, "epoch": 0.8355116898346078, "percentage": 42.75, "elapsed_time": "18:02:55", "remaining_time": "1 day, 0:10:13", "throughput": 333.35, "total_tokens": 21659776} {"current_steps": 17105, "total_steps": 40000, "loss": 0.08, "lr": 0.18382428152035643, "epoch": 0.8357559914983022, "percentage": 42.76, "elapsed_time": "18:02:58", "remaining_time": "1 day, 0:09:33", "throughput": 333.44, "total_tokens": 21666432} {"current_steps": 17110, "total_steps": 40000, "loss": 0.0753, "lr": 0.1837668911888596, "epoch": 0.8360002931619964, "percentage": 42.77, "elapsed_time": "18:03:01", "remaining_time": "1 day, 0:08:53", "throughput": 333.53, "total_tokens": 21673216} {"current_steps": 17115, "total_steps": 40000, "loss": 0.0902, "lr": 0.18370949565008388, "epoch": 0.8362445948256908, "percentage": 42.79, "elapsed_time": "18:03:04", "remaining_time": "1 day, 0:08:13", "throughput": 333.6, "total_tokens": 21679008} {"current_steps": 17120, "total_steps": 40000, "loss": 0.0525, "lr": 0.1836520949128803, "epoch": 0.8364888964893851, "percentage": 42.8, "elapsed_time": "18:03:07", "remaining_time": "1 day, 0:07:32", "throughput": 333.68, "total_tokens": 21685248} {"current_steps": 17125, "total_steps": 40000, "loss": 0.0614, "lr": 0.18359468898610076, "epoch": 0.8367331981530794, "percentage": 42.81, "elapsed_time": "18:03:10", "remaining_time": "1 day, 0:06:52", "throughput": 333.76, "total_tokens": 21691584} {"current_steps": 17130, "total_steps": 40000, "loss": 0.1036, "lr": 0.18353727787859797, "epoch": 0.8369774998167737, "percentage": 42.83, "elapsed_time": "18:03:14", "remaining_time": "1 day, 0:06:12", "throughput": 333.84, "total_tokens": 21697824} {"current_steps": 17135, "total_steps": 40000, "loss": 0.0745, "lr": 0.18347986159922552, "epoch": 0.8372218014804681, "percentage": 42.84, "elapsed_time": "18:03:17", "remaining_time": "1 day, 0:05:32", "throughput": 333.94, "total_tokens": 21704864} {"current_steps": 17140, "total_steps": 40000, "loss": 0.0748, "lr": 0.1834224401568377, "epoch": 0.8374661031441624, "percentage": 42.85, "elapsed_time": "18:03:20", "remaining_time": "1 day, 0:04:52", "throughput": 334.01, "total_tokens": 21710720} {"current_steps": 17145, "total_steps": 40000, "loss": 0.0588, "lr": 0.1833650135602896, "epoch": 0.8377104048078567, "percentage": 42.86, "elapsed_time": "18:03:23", "remaining_time": "1 day, 0:04:12", "throughput": 334.09, "total_tokens": 21716672} {"current_steps": 17150, "total_steps": 40000, "loss": 0.0795, "lr": 0.18330758181843707, "epoch": 0.8379547064715511, "percentage": 42.88, "elapsed_time": "18:03:26", "remaining_time": "1 day, 0:03:31", "throughput": 334.16, "total_tokens": 21722816} {"current_steps": 17155, "total_steps": 40000, "loss": 0.0893, "lr": 0.18325014494013686, "epoch": 0.8381990081352454, "percentage": 42.89, "elapsed_time": "18:03:29", "remaining_time": "1 day, 0:02:51", "throughput": 334.24, "total_tokens": 21728512} {"current_steps": 17160, "total_steps": 40000, "loss": 0.0603, "lr": 0.18319270293424647, "epoch": 0.8384433097989398, "percentage": 42.9, "elapsed_time": "18:03:32", "remaining_time": "1 day, 0:02:11", "throughput": 334.32, "total_tokens": 21735136} {"current_steps": 17165, "total_steps": 40000, "loss": 0.06, "lr": 0.18313525580962417, "epoch": 0.838687611462634, "percentage": 42.91, "elapsed_time": "18:03:35", "remaining_time": "1 day, 0:01:31", "throughput": 334.4, "total_tokens": 21741504} {"current_steps": 17170, "total_steps": 40000, "loss": 0.0602, "lr": 0.18307780357512896, "epoch": 0.8389319131263284, "percentage": 42.93, "elapsed_time": "18:03:38", "remaining_time": "1 day, 0:00:51", "throughput": 334.49, "total_tokens": 21748128} {"current_steps": 17175, "total_steps": 40000, "loss": 0.0593, "lr": 0.1830203462396208, "epoch": 0.8391762147900227, "percentage": 42.94, "elapsed_time": "18:03:41", "remaining_time": "1 day, 0:00:11", "throughput": 334.58, "total_tokens": 21754816} {"current_steps": 17180, "total_steps": 40000, "loss": 0.0781, "lr": 0.18296288381196033, "epoch": 0.8394205164537171, "percentage": 42.95, "elapsed_time": "18:03:45", "remaining_time": "23:59:32", "throughput": 334.66, "total_tokens": 21761408} {"current_steps": 17185, "total_steps": 40000, "loss": 0.052, "lr": 0.1829054163010089, "epoch": 0.8396648181174113, "percentage": 42.96, "elapsed_time": "18:03:48", "remaining_time": "23:58:52", "throughput": 334.74, "total_tokens": 21767712} {"current_steps": 17190, "total_steps": 40000, "loss": 0.0367, "lr": 0.18284794371562874, "epoch": 0.8399091197811057, "percentage": 42.98, "elapsed_time": "18:03:51", "remaining_time": "23:58:12", "throughput": 334.82, "total_tokens": 21774112} {"current_steps": 17195, "total_steps": 40000, "loss": 0.072, "lr": 0.18279046606468288, "epoch": 0.8401534214448, "percentage": 42.99, "elapsed_time": "18:03:54", "remaining_time": "23:57:32", "throughput": 334.9, "total_tokens": 21780000} {"current_steps": 17200, "total_steps": 40000, "loss": 0.0596, "lr": 0.1827329833570351, "epoch": 0.8403977231084944, "percentage": 43.0, "elapsed_time": "18:03:57", "remaining_time": "23:56:52", "throughput": 334.98, "total_tokens": 21786304} {"current_steps": 17200, "total_steps": 40000, "eval_loss": 0.06733512133359909, "epoch": 0.8403977231084944, "percentage": 43.0, "elapsed_time": "18:14:37", "remaining_time": "1 day, 0:11:01", "throughput": 331.72, "total_tokens": 21786304} {"current_steps": 17205, "total_steps": 40000, "loss": 0.0549, "lr": 0.18267549560154991, "epoch": 0.8406420247721887, "percentage": 43.01, "elapsed_time": "18:14:41", "remaining_time": "1 day, 0:10:21", "throughput": 331.79, "total_tokens": 21792576} {"current_steps": 17210, "total_steps": 40000, "loss": 0.0702, "lr": 0.18261800280709267, "epoch": 0.840886326435883, "percentage": 43.03, "elapsed_time": "18:14:44", "remaining_time": "1 day, 0:09:41", "throughput": 331.87, "total_tokens": 21798912} {"current_steps": 17215, "total_steps": 40000, "loss": 0.0618, "lr": 0.18256050498252957, "epoch": 0.8411306280995774, "percentage": 43.04, "elapsed_time": "18:14:47", "remaining_time": "1 day, 0:09:01", "throughput": 331.96, "total_tokens": 21805952} {"current_steps": 17220, "total_steps": 40000, "loss": 0.0686, "lr": 0.18250300213672735, "epoch": 0.8413749297632717, "percentage": 43.05, "elapsed_time": "18:14:50", "remaining_time": "1 day, 0:08:20", "throughput": 332.04, "total_tokens": 21812128} {"current_steps": 17225, "total_steps": 40000, "loss": 0.0686, "lr": 0.18244549427855378, "epoch": 0.841619231426966, "percentage": 43.06, "elapsed_time": "18:14:53", "remaining_time": "1 day, 0:07:40", "throughput": 332.12, "total_tokens": 21818240} {"current_steps": 17230, "total_steps": 40000, "loss": 0.048, "lr": 0.1823879814168772, "epoch": 0.8418635330906603, "percentage": 43.08, "elapsed_time": "18:14:56", "remaining_time": "1 day, 0:07:00", "throughput": 332.2, "total_tokens": 21824448} {"current_steps": 17235, "total_steps": 40000, "loss": 0.0946, "lr": 0.18233046356056692, "epoch": 0.8421078347543547, "percentage": 43.09, "elapsed_time": "18:14:59", "remaining_time": "1 day, 0:06:20", "throughput": 332.28, "total_tokens": 21830656} {"current_steps": 17240, "total_steps": 40000, "loss": 0.0627, "lr": 0.18227294071849284, "epoch": 0.842352136418049, "percentage": 43.1, "elapsed_time": "18:15:03", "remaining_time": "1 day, 0:05:40", "throughput": 332.36, "total_tokens": 21837056} {"current_steps": 17245, "total_steps": 40000, "loss": 0.0442, "lr": 0.18221541289952578, "epoch": 0.8425964380817433, "percentage": 43.11, "elapsed_time": "18:15:06", "remaining_time": "1 day, 0:05:00", "throughput": 332.45, "total_tokens": 21843872} {"current_steps": 17250, "total_steps": 40000, "loss": 0.079, "lr": 0.18215788011253717, "epoch": 0.8428407397454377, "percentage": 43.12, "elapsed_time": "18:15:09", "remaining_time": "1 day, 0:04:20", "throughput": 332.53, "total_tokens": 21850368} {"current_steps": 17255, "total_steps": 40000, "loss": 0.0488, "lr": 0.18210034236639935, "epoch": 0.843085041409132, "percentage": 43.14, "elapsed_time": "18:15:12", "remaining_time": "1 day, 0:03:40", "throughput": 332.62, "total_tokens": 21857056} {"current_steps": 17260, "total_steps": 40000, "loss": 0.0722, "lr": 0.1820427996699853, "epoch": 0.8433293430728264, "percentage": 43.15, "elapsed_time": "18:15:15", "remaining_time": "1 day, 0:03:00", "throughput": 332.7, "total_tokens": 21863328} {"current_steps": 17265, "total_steps": 40000, "loss": 0.0578, "lr": 0.1819852520321689, "epoch": 0.8435736447365206, "percentage": 43.16, "elapsed_time": "18:15:18", "remaining_time": "1 day, 0:02:20", "throughput": 332.77, "total_tokens": 21869376} {"current_steps": 17270, "total_steps": 40000, "loss": 0.0448, "lr": 0.18192769946182466, "epoch": 0.843817946400215, "percentage": 43.18, "elapsed_time": "18:15:21", "remaining_time": "1 day, 0:01:40", "throughput": 332.85, "total_tokens": 21875776} {"current_steps": 17275, "total_steps": 40000, "loss": 0.0413, "lr": 0.18187014196782794, "epoch": 0.8440622480639093, "percentage": 43.19, "elapsed_time": "18:15:24", "remaining_time": "1 day, 0:01:00", "throughput": 332.93, "total_tokens": 21882080} {"current_steps": 17280, "total_steps": 40000, "loss": 0.0681, "lr": 0.18181257955905486, "epoch": 0.8443065497276037, "percentage": 43.2, "elapsed_time": "18:15:28", "remaining_time": "1 day, 0:00:20", "throughput": 333.02, "total_tokens": 21888896} {"current_steps": 17285, "total_steps": 40000, "loss": 0.0667, "lr": 0.18175501224438217, "epoch": 0.8445508513912979, "percentage": 43.21, "elapsed_time": "18:15:31", "remaining_time": "23:59:40", "throughput": 333.1, "total_tokens": 21895104} {"current_steps": 17290, "total_steps": 40000, "loss": 0.0574, "lr": 0.18169744003268756, "epoch": 0.8447951530549923, "percentage": 43.23, "elapsed_time": "18:15:34", "remaining_time": "23:59:00", "throughput": 333.18, "total_tokens": 21901344} {"current_steps": 17295, "total_steps": 40000, "loss": 0.0861, "lr": 0.18163986293284937, "epoch": 0.8450394547186867, "percentage": 43.24, "elapsed_time": "18:15:37", "remaining_time": "23:58:20", "throughput": 333.26, "total_tokens": 21907584} {"current_steps": 17300, "total_steps": 40000, "loss": 0.0818, "lr": 0.18158228095374673, "epoch": 0.845283756382381, "percentage": 43.25, "elapsed_time": "18:15:40", "remaining_time": "23:57:40", "throughput": 333.34, "total_tokens": 21913984} {"current_steps": 17305, "total_steps": 40000, "loss": 0.0712, "lr": 0.18152469410425945, "epoch": 0.8455280580460753, "percentage": 43.26, "elapsed_time": "18:15:43", "remaining_time": "23:57:00", "throughput": 333.42, "total_tokens": 21919968} {"current_steps": 17310, "total_steps": 40000, "loss": 0.0583, "lr": 0.18146710239326813, "epoch": 0.8457723597097696, "percentage": 43.28, "elapsed_time": "18:15:46", "remaining_time": "23:56:20", "throughput": 333.5, "total_tokens": 21926400} {"current_steps": 17315, "total_steps": 40000, "loss": 0.0546, "lr": 0.18140950582965423, "epoch": 0.846016661373464, "percentage": 43.29, "elapsed_time": "18:15:49", "remaining_time": "23:55:40", "throughput": 333.58, "total_tokens": 21932640} {"current_steps": 17320, "total_steps": 40000, "loss": 0.0645, "lr": 0.1813519044222998, "epoch": 0.8462609630371583, "percentage": 43.3, "elapsed_time": "18:15:52", "remaining_time": "23:55:00", "throughput": 333.66, "total_tokens": 21938656} {"current_steps": 17325, "total_steps": 40000, "loss": 0.0689, "lr": 0.18129429818008772, "epoch": 0.8465052647008526, "percentage": 43.31, "elapsed_time": "18:15:55", "remaining_time": "23:54:21", "throughput": 333.74, "total_tokens": 21945024} {"current_steps": 17330, "total_steps": 40000, "loss": 0.0859, "lr": 0.18123668711190163, "epoch": 0.8467495663645469, "percentage": 43.33, "elapsed_time": "18:15:58", "remaining_time": "23:53:41", "throughput": 333.82, "total_tokens": 21951616} {"current_steps": 17335, "total_steps": 40000, "loss": 0.0599, "lr": 0.18117907122662583, "epoch": 0.8469938680282413, "percentage": 43.34, "elapsed_time": "18:16:01", "remaining_time": "23:53:01", "throughput": 333.9, "total_tokens": 21957952} {"current_steps": 17340, "total_steps": 40000, "loss": 0.0546, "lr": 0.1811214505331454, "epoch": 0.8472381696919355, "percentage": 43.35, "elapsed_time": "18:16:04", "remaining_time": "23:52:21", "throughput": 333.98, "total_tokens": 21964480} {"current_steps": 17345, "total_steps": 40000, "loss": 0.0706, "lr": 0.1810638250403462, "epoch": 0.8474824713556299, "percentage": 43.36, "elapsed_time": "18:16:07", "remaining_time": "23:51:42", "throughput": 334.06, "total_tokens": 21970400} {"current_steps": 17350, "total_steps": 40000, "loss": 0.0645, "lr": 0.1810061947571148, "epoch": 0.8477267730193243, "percentage": 43.38, "elapsed_time": "18:16:10", "remaining_time": "23:51:02", "throughput": 334.13, "total_tokens": 21976256} {"current_steps": 17355, "total_steps": 40000, "loss": 0.0591, "lr": 0.1809485596923385, "epoch": 0.8479710746830186, "percentage": 43.39, "elapsed_time": "18:16:14", "remaining_time": "23:50:22", "throughput": 334.21, "total_tokens": 21982272} {"current_steps": 17360, "total_steps": 40000, "loss": 0.0624, "lr": 0.18089091985490546, "epoch": 0.848215376346713, "percentage": 43.4, "elapsed_time": "18:16:17", "remaining_time": "23:49:43", "throughput": 334.29, "total_tokens": 21988512} {"current_steps": 17365, "total_steps": 40000, "loss": 0.0638, "lr": 0.18083327525370432, "epoch": 0.8484596780104072, "percentage": 43.41, "elapsed_time": "18:16:20", "remaining_time": "23:49:03", "throughput": 334.37, "total_tokens": 21994656} {"current_steps": 17370, "total_steps": 40000, "loss": 0.0715, "lr": 0.18077562589762464, "epoch": 0.8487039796741016, "percentage": 43.43, "elapsed_time": "18:16:23", "remaining_time": "23:48:23", "throughput": 334.45, "total_tokens": 22000928} {"current_steps": 17375, "total_steps": 40000, "loss": 0.0628, "lr": 0.1807179717955567, "epoch": 0.8489482813377959, "percentage": 43.44, "elapsed_time": "18:16:26", "remaining_time": "23:47:44", "throughput": 334.53, "total_tokens": 22007520} {"current_steps": 17380, "total_steps": 40000, "loss": 0.0773, "lr": 0.1806603129563915, "epoch": 0.8491925830014903, "percentage": 43.45, "elapsed_time": "18:16:29", "remaining_time": "23:47:04", "throughput": 334.61, "total_tokens": 22013664} {"current_steps": 17385, "total_steps": 40000, "loss": 0.0491, "lr": 0.1806026493890208, "epoch": 0.8494368846651845, "percentage": 43.46, "elapsed_time": "18:16:32", "remaining_time": "23:46:25", "throughput": 334.69, "total_tokens": 22020064} {"current_steps": 17390, "total_steps": 40000, "loss": 0.0881, "lr": 0.18054498110233688, "epoch": 0.8496811863288789, "percentage": 43.48, "elapsed_time": "18:16:35", "remaining_time": "23:45:45", "throughput": 334.77, "total_tokens": 22026336} {"current_steps": 17395, "total_steps": 40000, "loss": 0.0908, "lr": 0.1804873081052331, "epoch": 0.8499254879925733, "percentage": 43.49, "elapsed_time": "18:16:38", "remaining_time": "23:45:06", "throughput": 334.85, "total_tokens": 22032864} {"current_steps": 17400, "total_steps": 40000, "loss": 0.0473, "lr": 0.18042963040660326, "epoch": 0.8501697896562675, "percentage": 43.5, "elapsed_time": "18:16:41", "remaining_time": "23:44:26", "throughput": 334.93, "total_tokens": 22039232} {"current_steps": 17400, "total_steps": 40000, "eval_loss": 0.06643195450305939, "epoch": 0.8501697896562675, "percentage": 43.5, "elapsed_time": "18:27:21", "remaining_time": "23:58:18", "throughput": 331.71, "total_tokens": 22039232} {"current_steps": 17405, "total_steps": 40000, "loss": 0.0674, "lr": 0.180371948015342, "epoch": 0.8504140913199619, "percentage": 43.51, "elapsed_time": "18:27:25", "remaining_time": "23:57:39", "throughput": 331.78, "total_tokens": 22045472} {"current_steps": 17410, "total_steps": 40000, "loss": 0.0592, "lr": 0.18031426094034472, "epoch": 0.8506583929836562, "percentage": 43.53, "elapsed_time": "18:27:28", "remaining_time": "23:56:59", "throughput": 331.86, "total_tokens": 22051936} {"current_steps": 17415, "total_steps": 40000, "loss": 0.0631, "lr": 0.18025656919050737, "epoch": 0.8509026946473506, "percentage": 43.54, "elapsed_time": "18:27:32", "remaining_time": "23:56:19", "throughput": 331.95, "total_tokens": 22058496} {"current_steps": 17420, "total_steps": 40000, "loss": 0.0736, "lr": 0.18019887277472688, "epoch": 0.8511469963110448, "percentage": 43.55, "elapsed_time": "18:27:35", "remaining_time": "23:55:39", "throughput": 332.02, "total_tokens": 22064448} {"current_steps": 17425, "total_steps": 40000, "loss": 0.0512, "lr": 0.18014117170190067, "epoch": 0.8513912979747392, "percentage": 43.56, "elapsed_time": "18:27:38", "remaining_time": "23:55:00", "throughput": 332.1, "total_tokens": 22070848} {"current_steps": 17430, "total_steps": 40000, "loss": 0.0705, "lr": 0.18008346598092703, "epoch": 0.8516355996384335, "percentage": 43.58, "elapsed_time": "18:27:41", "remaining_time": "23:54:20", "throughput": 332.18, "total_tokens": 22077184} {"current_steps": 17435, "total_steps": 40000, "loss": 0.0428, "lr": 0.18002575562070489, "epoch": 0.8518799013021279, "percentage": 43.59, "elapsed_time": "18:27:44", "remaining_time": "23:53:40", "throughput": 332.26, "total_tokens": 22083616} {"current_steps": 17440, "total_steps": 40000, "loss": 0.0701, "lr": 0.1799680406301339, "epoch": 0.8521242029658221, "percentage": 43.6, "elapsed_time": "18:27:47", "remaining_time": "23:53:00", "throughput": 332.34, "total_tokens": 22090112} {"current_steps": 17445, "total_steps": 40000, "loss": 0.0409, "lr": 0.17991032101811447, "epoch": 0.8523685046295165, "percentage": 43.61, "elapsed_time": "18:27:50", "remaining_time": "23:52:21", "throughput": 332.42, "total_tokens": 22096192} {"current_steps": 17450, "total_steps": 40000, "loss": 0.0899, "lr": 0.1798525967935476, "epoch": 0.8526128062932109, "percentage": 43.62, "elapsed_time": "18:27:53", "remaining_time": "23:51:41", "throughput": 332.5, "total_tokens": 22102336} {"current_steps": 17455, "total_steps": 40000, "loss": 0.0538, "lr": 0.17979486796533517, "epoch": 0.8528571079569052, "percentage": 43.64, "elapsed_time": "18:27:56", "remaining_time": "23:51:01", "throughput": 332.57, "total_tokens": 22108416} {"current_steps": 17460, "total_steps": 40000, "loss": 0.0446, "lr": 0.1797371345423797, "epoch": 0.8531014096205995, "percentage": 43.65, "elapsed_time": "18:27:59", "remaining_time": "23:50:22", "throughput": 332.66, "total_tokens": 22114944} {"current_steps": 17465, "total_steps": 40000, "loss": 0.0519, "lr": 0.17967939653358436, "epoch": 0.8533457112842938, "percentage": 43.66, "elapsed_time": "18:28:02", "remaining_time": "23:49:42", "throughput": 332.74, "total_tokens": 22121536} {"current_steps": 17470, "total_steps": 40000, "loss": 0.0323, "lr": 0.17962165394785315, "epoch": 0.8535900129479882, "percentage": 43.68, "elapsed_time": "18:28:05", "remaining_time": "23:49:02", "throughput": 332.81, "total_tokens": 22127392} {"current_steps": 17475, "total_steps": 40000, "loss": 0.0709, "lr": 0.17956390679409057, "epoch": 0.8538343146116825, "percentage": 43.69, "elapsed_time": "18:28:08", "remaining_time": "23:48:23", "throughput": 332.89, "total_tokens": 22133504} {"current_steps": 17480, "total_steps": 40000, "loss": 0.0736, "lr": 0.1795061550812021, "epoch": 0.8540786162753768, "percentage": 43.7, "elapsed_time": "18:28:12", "remaining_time": "23:47:43", "throughput": 332.98, "total_tokens": 22140416} {"current_steps": 17485, "total_steps": 40000, "loss": 0.0686, "lr": 0.1794483988180937, "epoch": 0.8543229179390711, "percentage": 43.71, "elapsed_time": "18:28:15", "remaining_time": "23:47:04", "throughput": 333.06, "total_tokens": 22146560} {"current_steps": 17490, "total_steps": 40000, "loss": 0.0561, "lr": 0.17939063801367214, "epoch": 0.8545672196027655, "percentage": 43.73, "elapsed_time": "18:28:18", "remaining_time": "23:46:24", "throughput": 333.13, "total_tokens": 22152768} {"current_steps": 17495, "total_steps": 40000, "loss": 0.0837, "lr": 0.17933287267684483, "epoch": 0.8548115212664599, "percentage": 43.74, "elapsed_time": "18:28:21", "remaining_time": "23:45:45", "throughput": 333.22, "total_tokens": 22159776} {"current_steps": 17500, "total_steps": 40000, "loss": 0.0439, "lr": 0.17927510281651995, "epoch": 0.8550558229301541, "percentage": 43.75, "elapsed_time": "18:28:24", "remaining_time": "23:45:05", "throughput": 333.3, "total_tokens": 22165632} {"current_steps": 17505, "total_steps": 40000, "loss": 0.0831, "lr": 0.17921732844160634, "epoch": 0.8553001245938485, "percentage": 43.76, "elapsed_time": "18:28:27", "remaining_time": "23:44:26", "throughput": 333.38, "total_tokens": 22172288} {"current_steps": 17510, "total_steps": 40000, "loss": 0.0613, "lr": 0.17915954956101351, "epoch": 0.8555444262575428, "percentage": 43.77, "elapsed_time": "18:28:30", "remaining_time": "23:43:46", "throughput": 333.46, "total_tokens": 22178432} {"current_steps": 17515, "total_steps": 40000, "loss": 0.0438, "lr": 0.17910176618365165, "epoch": 0.8557887279212372, "percentage": 43.79, "elapsed_time": "18:28:33", "remaining_time": "23:43:07", "throughput": 333.54, "total_tokens": 22184704} {"current_steps": 17520, "total_steps": 40000, "loss": 0.0543, "lr": 0.17904397831843177, "epoch": 0.8560330295849314, "percentage": 43.8, "elapsed_time": "18:28:36", "remaining_time": "23:42:27", "throughput": 333.61, "total_tokens": 22190912} {"current_steps": 17525, "total_steps": 40000, "loss": 0.0824, "lr": 0.17898618597426547, "epoch": 0.8562773312486258, "percentage": 43.81, "elapsed_time": "18:28:39", "remaining_time": "23:41:48", "throughput": 333.69, "total_tokens": 22197120} {"current_steps": 17530, "total_steps": 40000, "loss": 0.0603, "lr": 0.17892838916006495, "epoch": 0.8565216329123201, "percentage": 43.82, "elapsed_time": "18:28:42", "remaining_time": "23:41:09", "throughput": 333.77, "total_tokens": 22203424} {"current_steps": 17535, "total_steps": 40000, "loss": 0.0668, "lr": 0.17887058788474333, "epoch": 0.8567659345760145, "percentage": 43.84, "elapsed_time": "18:28:45", "remaining_time": "23:40:29", "throughput": 333.85, "total_tokens": 22209792} {"current_steps": 17540, "total_steps": 40000, "loss": 0.0595, "lr": 0.17881278215721427, "epoch": 0.8570102362397088, "percentage": 43.85, "elapsed_time": "18:28:48", "remaining_time": "23:39:50", "throughput": 333.93, "total_tokens": 22215904} {"current_steps": 17545, "total_steps": 40000, "loss": 0.0816, "lr": 0.1787549719863921, "epoch": 0.8572545379034031, "percentage": 43.86, "elapsed_time": "18:28:51", "remaining_time": "23:39:10", "throughput": 334.01, "total_tokens": 22222176} {"current_steps": 17550, "total_steps": 40000, "loss": 0.0772, "lr": 0.17869715738119188, "epoch": 0.8574988395670975, "percentage": 43.88, "elapsed_time": "18:28:54", "remaining_time": "23:38:31", "throughput": 334.08, "total_tokens": 22227968} {"current_steps": 17555, "total_steps": 40000, "loss": 0.0922, "lr": 0.17863933835052936, "epoch": 0.8577431412307918, "percentage": 43.89, "elapsed_time": "18:28:57", "remaining_time": "23:37:52", "throughput": 334.15, "total_tokens": 22233920} {"current_steps": 17560, "total_steps": 40000, "loss": 0.0278, "lr": 0.17858151490332097, "epoch": 0.8579874428944861, "percentage": 43.9, "elapsed_time": "18:29:00", "remaining_time": "23:37:12", "throughput": 334.23, "total_tokens": 22240160} {"current_steps": 17565, "total_steps": 40000, "loss": 0.0856, "lr": 0.17852368704848381, "epoch": 0.8582317445581804, "percentage": 43.91, "elapsed_time": "18:29:03", "remaining_time": "23:36:33", "throughput": 334.31, "total_tokens": 22246528} {"current_steps": 17570, "total_steps": 40000, "loss": 0.0871, "lr": 0.17846585479493565, "epoch": 0.8584760462218748, "percentage": 43.92, "elapsed_time": "18:29:06", "remaining_time": "23:35:54", "throughput": 334.39, "total_tokens": 22252736} {"current_steps": 17575, "total_steps": 40000, "loss": 0.0406, "lr": 0.178408018151595, "epoch": 0.8587203478855691, "percentage": 43.94, "elapsed_time": "18:29:10", "remaining_time": "23:35:15", "throughput": 334.47, "total_tokens": 22259008} {"current_steps": 17580, "total_steps": 40000, "loss": 0.0644, "lr": 0.17835017712738085, "epoch": 0.8589646495492634, "percentage": 43.95, "elapsed_time": "18:29:13", "remaining_time": "23:34:36", "throughput": 334.55, "total_tokens": 22265184} {"current_steps": 17585, "total_steps": 40000, "loss": 0.0699, "lr": 0.17829233173121323, "epoch": 0.8592089512129577, "percentage": 43.96, "elapsed_time": "18:29:16", "remaining_time": "23:33:57", "throughput": 334.63, "total_tokens": 22271648} {"current_steps": 17590, "total_steps": 40000, "loss": 0.0806, "lr": 0.17823448197201244, "epoch": 0.8594532528766521, "percentage": 43.97, "elapsed_time": "18:29:19", "remaining_time": "23:33:17", "throughput": 334.71, "total_tokens": 22278208} {"current_steps": 17595, "total_steps": 40000, "loss": 0.0776, "lr": 0.1781766278586997, "epoch": 0.8596975545403465, "percentage": 43.99, "elapsed_time": "18:29:22", "remaining_time": "23:32:38", "throughput": 334.79, "total_tokens": 22284192} {"current_steps": 17600, "total_steps": 40000, "loss": 0.0471, "lr": 0.1781187694001969, "epoch": 0.8599418562040407, "percentage": 44.0, "elapsed_time": "18:29:25", "remaining_time": "23:31:59", "throughput": 334.87, "total_tokens": 22290976} {"current_steps": 17600, "total_steps": 40000, "eval_loss": 0.0661223754286766, "epoch": 0.8599418562040407, "percentage": 44.0, "elapsed_time": "18:40:05", "remaining_time": "23:45:34", "throughput": 331.68, "total_tokens": 22290976} {"current_steps": 17605, "total_steps": 40000, "loss": 0.0419, "lr": 0.1780609066054265, "epoch": 0.8601861578677351, "percentage": 44.01, "elapsed_time": "18:40:09", "remaining_time": "23:44:56", "throughput": 331.76, "total_tokens": 22297216} {"current_steps": 17610, "total_steps": 40000, "loss": 0.0659, "lr": 0.17800303948331164, "epoch": 0.8604304595314294, "percentage": 44.02, "elapsed_time": "18:40:12", "remaining_time": "23:44:16", "throughput": 331.83, "total_tokens": 22303296} {"current_steps": 17615, "total_steps": 40000, "loss": 0.0872, "lr": 0.1779451680427762, "epoch": 0.8606747611951238, "percentage": 44.04, "elapsed_time": "18:40:15", "remaining_time": "23:43:37", "throughput": 331.91, "total_tokens": 22309792} {"current_steps": 17620, "total_steps": 40000, "loss": 0.0542, "lr": 0.17788729229274464, "epoch": 0.860919062858818, "percentage": 44.05, "elapsed_time": "18:40:18", "remaining_time": "23:42:57", "throughput": 331.99, "total_tokens": 22316128} {"current_steps": 17625, "total_steps": 40000, "loss": 0.0609, "lr": 0.17782941224214222, "epoch": 0.8611633645225124, "percentage": 44.06, "elapsed_time": "18:40:22", "remaining_time": "23:42:18", "throughput": 332.07, "total_tokens": 22322656} {"current_steps": 17630, "total_steps": 40000, "loss": 0.0274, "lr": 0.17777152789989464, "epoch": 0.8614076661862067, "percentage": 44.07, "elapsed_time": "18:40:25", "remaining_time": "23:41:39", "throughput": 332.15, "total_tokens": 22328960} {"current_steps": 17635, "total_steps": 40000, "loss": 0.1068, "lr": 0.17771363927492845, "epoch": 0.8616519678499011, "percentage": 44.09, "elapsed_time": "18:40:28", "remaining_time": "23:40:59", "throughput": 332.23, "total_tokens": 22335552} {"current_steps": 17640, "total_steps": 40000, "loss": 0.0449, "lr": 0.17765574637617085, "epoch": 0.8618962695135954, "percentage": 44.1, "elapsed_time": "18:40:31", "remaining_time": "23:40:20", "throughput": 332.31, "total_tokens": 22341664} {"current_steps": 17645, "total_steps": 40000, "loss": 0.087, "lr": 0.17759784921254962, "epoch": 0.8621405711772897, "percentage": 44.11, "elapsed_time": "18:40:34", "remaining_time": "23:39:41", "throughput": 332.39, "total_tokens": 22348128} {"current_steps": 17650, "total_steps": 40000, "loss": 0.0633, "lr": 0.1775399477929932, "epoch": 0.8623848728409841, "percentage": 44.12, "elapsed_time": "18:40:37", "remaining_time": "23:39:02", "throughput": 332.47, "total_tokens": 22354720} {"current_steps": 17655, "total_steps": 40000, "loss": 0.0696, "lr": 0.17748204212643076, "epoch": 0.8626291745046784, "percentage": 44.14, "elapsed_time": "18:40:40", "remaining_time": "23:38:22", "throughput": 332.55, "total_tokens": 22360672} {"current_steps": 17660, "total_steps": 40000, "loss": 0.0605, "lr": 0.17742413222179204, "epoch": 0.8628734761683727, "percentage": 44.15, "elapsed_time": "18:40:43", "remaining_time": "23:37:43", "throughput": 332.62, "total_tokens": 22366816} {"current_steps": 17665, "total_steps": 40000, "loss": 0.0664, "lr": 0.17736621808800754, "epoch": 0.863117777832067, "percentage": 44.16, "elapsed_time": "18:40:46", "remaining_time": "23:37:04", "throughput": 332.71, "total_tokens": 22373376} {"current_steps": 17670, "total_steps": 40000, "loss": 0.0621, "lr": 0.17730829973400827, "epoch": 0.8633620794957614, "percentage": 44.17, "elapsed_time": "18:40:49", "remaining_time": "23:36:25", "throughput": 332.78, "total_tokens": 22379488} {"current_steps": 17675, "total_steps": 40000, "loss": 0.1226, "lr": 0.17725037716872602, "epoch": 0.8636063811594556, "percentage": 44.19, "elapsed_time": "18:40:52", "remaining_time": "23:35:45", "throughput": 332.86, "total_tokens": 22385536} {"current_steps": 17680, "total_steps": 40000, "loss": 0.0685, "lr": 0.17719245040109313, "epoch": 0.86385068282315, "percentage": 44.2, "elapsed_time": "18:40:55", "remaining_time": "23:35:06", "throughput": 332.94, "total_tokens": 22392128} {"current_steps": 17685, "total_steps": 40000, "loss": 0.043, "lr": 0.17713451944004271, "epoch": 0.8640949844868444, "percentage": 44.21, "elapsed_time": "18:40:59", "remaining_time": "23:34:27", "throughput": 333.02, "total_tokens": 22398688} {"current_steps": 17690, "total_steps": 40000, "loss": 0.0646, "lr": 0.17707658429450843, "epoch": 0.8643392861505387, "percentage": 44.22, "elapsed_time": "18:41:02", "remaining_time": "23:33:48", "throughput": 333.1, "total_tokens": 22405280} {"current_steps": 17695, "total_steps": 40000, "loss": 0.0545, "lr": 0.1770186449734245, "epoch": 0.8645835878142331, "percentage": 44.24, "elapsed_time": "18:41:05", "remaining_time": "23:33:09", "throughput": 333.19, "total_tokens": 22411968} {"current_steps": 17700, "total_steps": 40000, "loss": 0.08, "lr": 0.17696070148572599, "epoch": 0.8648278894779273, "percentage": 44.25, "elapsed_time": "18:41:08", "remaining_time": "23:32:30", "throughput": 333.26, "total_tokens": 22418080} {"current_steps": 17705, "total_steps": 40000, "loss": 0.1011, "lr": 0.17690275384034856, "epoch": 0.8650721911416217, "percentage": 44.26, "elapsed_time": "18:41:11", "remaining_time": "23:31:51", "throughput": 333.34, "total_tokens": 22424256} {"current_steps": 17710, "total_steps": 40000, "loss": 0.058, "lr": 0.17684480204622835, "epoch": 0.865316492805316, "percentage": 44.27, "elapsed_time": "18:41:14", "remaining_time": "23:31:12", "throughput": 333.42, "total_tokens": 22430816} {"current_steps": 17715, "total_steps": 40000, "loss": 0.0562, "lr": 0.1767868461123023, "epoch": 0.8655607944690104, "percentage": 44.29, "elapsed_time": "18:41:17", "remaining_time": "23:30:33", "throughput": 333.51, "total_tokens": 22437536} {"current_steps": 17720, "total_steps": 40000, "loss": 0.06, "lr": 0.176728886047508, "epoch": 0.8658050961327046, "percentage": 44.3, "elapsed_time": "18:41:20", "remaining_time": "23:29:54", "throughput": 333.59, "total_tokens": 22443936} {"current_steps": 17725, "total_steps": 40000, "loss": 0.0683, "lr": 0.17667092186078362, "epoch": 0.866049397796399, "percentage": 44.31, "elapsed_time": "18:41:23", "remaining_time": "23:29:15", "throughput": 333.66, "total_tokens": 22450016} {"current_steps": 17730, "total_steps": 40000, "loss": 0.0711, "lr": 0.17661295356106785, "epoch": 0.8662936994600933, "percentage": 44.32, "elapsed_time": "18:41:26", "remaining_time": "23:28:36", "throughput": 333.74, "total_tokens": 22456096} {"current_steps": 17735, "total_steps": 40000, "loss": 0.0709, "lr": 0.1765549811573002, "epoch": 0.8665380011237876, "percentage": 44.34, "elapsed_time": "18:41:30", "remaining_time": "23:27:57", "throughput": 333.82, "total_tokens": 22462432} {"current_steps": 17740, "total_steps": 40000, "loss": 0.0387, "lr": 0.17649700465842078, "epoch": 0.866782302787482, "percentage": 44.35, "elapsed_time": "18:41:33", "remaining_time": "23:27:18", "throughput": 333.89, "total_tokens": 22468576} {"current_steps": 17745, "total_steps": 40000, "loss": 0.057, "lr": 0.17643902407337023, "epoch": 0.8670266044511763, "percentage": 44.36, "elapsed_time": "18:41:36", "remaining_time": "23:26:39", "throughput": 333.97, "total_tokens": 22474880} {"current_steps": 17750, "total_steps": 40000, "loss": 0.0494, "lr": 0.17638103941108993, "epoch": 0.8672709061148707, "percentage": 44.38, "elapsed_time": "18:41:39", "remaining_time": "23:26:00", "throughput": 334.04, "total_tokens": 22480832} {"current_steps": 17755, "total_steps": 40000, "loss": 0.093, "lr": 0.1763230506805218, "epoch": 0.867515207778565, "percentage": 44.39, "elapsed_time": "18:41:42", "remaining_time": "23:25:21", "throughput": 334.12, "total_tokens": 22486848} {"current_steps": 17760, "total_steps": 40000, "loss": 0.0567, "lr": 0.1762650578906085, "epoch": 0.8677595094422593, "percentage": 44.4, "elapsed_time": "18:41:45", "remaining_time": "23:24:43", "throughput": 334.2, "total_tokens": 22493344} {"current_steps": 17765, "total_steps": 40000, "loss": 0.0733, "lr": 0.1762070610502932, "epoch": 0.8680038111059536, "percentage": 44.41, "elapsed_time": "18:41:48", "remaining_time": "23:24:04", "throughput": 334.28, "total_tokens": 22499776} {"current_steps": 17770, "total_steps": 40000, "loss": 0.0736, "lr": 0.17614906016851975, "epoch": 0.868248112769648, "percentage": 44.42, "elapsed_time": "18:41:51", "remaining_time": "23:23:25", "throughput": 334.35, "total_tokens": 22505536} {"current_steps": 17775, "total_steps": 40000, "loss": 0.0482, "lr": 0.17609105525423258, "epoch": 0.8684924144333422, "percentage": 44.44, "elapsed_time": "18:41:54", "remaining_time": "23:22:46", "throughput": 334.43, "total_tokens": 22512256} {"current_steps": 17780, "total_steps": 40000, "loss": 0.0752, "lr": 0.1760330463163768, "epoch": 0.8687367160970366, "percentage": 44.45, "elapsed_time": "18:41:57", "remaining_time": "23:22:08", "throughput": 334.52, "total_tokens": 22518784} {"current_steps": 17785, "total_steps": 40000, "loss": 0.07, "lr": 0.17597503336389816, "epoch": 0.868981017760731, "percentage": 44.46, "elapsed_time": "18:42:00", "remaining_time": "23:21:29", "throughput": 334.59, "total_tokens": 22524896} {"current_steps": 17790, "total_steps": 40000, "loss": 0.0649, "lr": 0.17591701640574298, "epoch": 0.8692253194244253, "percentage": 44.47, "elapsed_time": "18:42:03", "remaining_time": "23:20:50", "throughput": 334.67, "total_tokens": 22531488} {"current_steps": 17795, "total_steps": 40000, "loss": 0.0759, "lr": 0.17585899545085815, "epoch": 0.8694696210881196, "percentage": 44.49, "elapsed_time": "18:42:06", "remaining_time": "23:20:12", "throughput": 334.75, "total_tokens": 22537792} {"current_steps": 17800, "total_steps": 40000, "loss": 0.0735, "lr": 0.17580097050819124, "epoch": 0.8697139227518139, "percentage": 44.5, "elapsed_time": "18:42:09", "remaining_time": "23:19:33", "throughput": 334.83, "total_tokens": 22543904} {"current_steps": 17800, "total_steps": 40000, "eval_loss": 0.07252977043390274, "epoch": 0.8697139227518139, "percentage": 44.5, "elapsed_time": "18:52:50", "remaining_time": "23:32:51", "throughput": 331.67, "total_tokens": 22543904} {"current_steps": 17805, "total_steps": 40000, "loss": 0.0739, "lr": 0.17574294158669046, "epoch": 0.8699582244155083, "percentage": 44.51, "elapsed_time": "18:52:53", "remaining_time": "23:32:13", "throughput": 331.75, "total_tokens": 22550208} {"current_steps": 17810, "total_steps": 40000, "loss": 0.0731, "lr": 0.17568490869530456, "epoch": 0.8702025260792026, "percentage": 44.52, "elapsed_time": "18:52:57", "remaining_time": "23:31:34", "throughput": 331.82, "total_tokens": 22556384} {"current_steps": 17815, "total_steps": 40000, "loss": 0.0694, "lr": 0.17562687184298295, "epoch": 0.870446827742897, "percentage": 44.54, "elapsed_time": "18:53:00", "remaining_time": "23:30:55", "throughput": 331.9, "total_tokens": 22562656} {"current_steps": 17820, "total_steps": 40000, "loss": 0.0816, "lr": 0.1755688310386757, "epoch": 0.8706911294065912, "percentage": 44.55, "elapsed_time": "18:53:03", "remaining_time": "23:30:16", "throughput": 331.98, "total_tokens": 22568896} {"current_steps": 17825, "total_steps": 40000, "loss": 0.0547, "lr": 0.17551078629133335, "epoch": 0.8709354310702856, "percentage": 44.56, "elapsed_time": "18:53:06", "remaining_time": "23:29:37", "throughput": 332.06, "total_tokens": 22575296} {"current_steps": 17830, "total_steps": 40000, "loss": 0.0579, "lr": 0.17545273760990718, "epoch": 0.87117973273398, "percentage": 44.57, "elapsed_time": "18:53:09", "remaining_time": "23:28:58", "throughput": 332.13, "total_tokens": 22581376} {"current_steps": 17835, "total_steps": 40000, "loss": 0.0572, "lr": 0.17539468500334904, "epoch": 0.8714240343976742, "percentage": 44.59, "elapsed_time": "18:53:12", "remaining_time": "23:28:19", "throughput": 332.21, "total_tokens": 22587968} {"current_steps": 17840, "total_steps": 40000, "loss": 0.0633, "lr": 0.17533662848061132, "epoch": 0.8716683360613686, "percentage": 44.6, "elapsed_time": "18:53:15", "remaining_time": "23:27:40", "throughput": 332.3, "total_tokens": 22594848} {"current_steps": 17845, "total_steps": 40000, "loss": 0.0718, "lr": 0.1752785680506471, "epoch": 0.8719126377250629, "percentage": 44.61, "elapsed_time": "18:53:18", "remaining_time": "23:27:02", "throughput": 332.38, "total_tokens": 22601120} {"current_steps": 17850, "total_steps": 40000, "loss": 0.0491, "lr": 0.17522050372241, "epoch": 0.8721569393887573, "percentage": 44.62, "elapsed_time": "18:53:21", "remaining_time": "23:26:23", "throughput": 332.45, "total_tokens": 22607488} {"current_steps": 17855, "total_steps": 40000, "loss": 0.0687, "lr": 0.17516243550485425, "epoch": 0.8724012410524515, "percentage": 44.64, "elapsed_time": "18:53:24", "remaining_time": "23:25:44", "throughput": 332.53, "total_tokens": 22613728} {"current_steps": 17860, "total_steps": 40000, "loss": 0.0637, "lr": 0.17510436340693478, "epoch": 0.8726455427161459, "percentage": 44.65, "elapsed_time": "18:53:27", "remaining_time": "23:25:05", "throughput": 332.61, "total_tokens": 22619776} {"current_steps": 17865, "total_steps": 40000, "loss": 0.0527, "lr": 0.175046287437607, "epoch": 0.8728898443798402, "percentage": 44.66, "elapsed_time": "18:53:30", "remaining_time": "23:24:26", "throughput": 332.68, "total_tokens": 22626112} {"current_steps": 17870, "total_steps": 40000, "loss": 0.0723, "lr": 0.17498820760582695, "epoch": 0.8731341460435346, "percentage": 44.67, "elapsed_time": "18:53:34", "remaining_time": "23:23:47", "throughput": 332.77, "total_tokens": 22632704} {"current_steps": 17875, "total_steps": 40000, "loss": 0.0392, "lr": 0.1749301239205512, "epoch": 0.8733784477072288, "percentage": 44.69, "elapsed_time": "18:53:37", "remaining_time": "23:23:09", "throughput": 332.84, "total_tokens": 22639008} {"current_steps": 17880, "total_steps": 40000, "loss": 0.0629, "lr": 0.1748720363907371, "epoch": 0.8736227493709232, "percentage": 44.7, "elapsed_time": "18:53:40", "remaining_time": "23:22:30", "throughput": 332.92, "total_tokens": 22645152} {"current_steps": 17885, "total_steps": 40000, "loss": 0.0663, "lr": 0.17481394502534242, "epoch": 0.8738670510346176, "percentage": 44.71, "elapsed_time": "18:53:43", "remaining_time": "23:21:51", "throughput": 332.99, "total_tokens": 22650944} {"current_steps": 17890, "total_steps": 40000, "loss": 0.0563, "lr": 0.17475584983332562, "epoch": 0.8741113526983119, "percentage": 44.73, "elapsed_time": "18:53:46", "remaining_time": "23:21:13", "throughput": 333.08, "total_tokens": 22658176} {"current_steps": 17895, "total_steps": 40000, "loss": 0.0672, "lr": 0.17469775082364558, "epoch": 0.8743556543620062, "percentage": 44.74, "elapsed_time": "18:53:49", "remaining_time": "23:20:34", "throughput": 333.15, "total_tokens": 22664320} {"current_steps": 17900, "total_steps": 40000, "loss": 0.077, "lr": 0.17463964800526205, "epoch": 0.8745999560257005, "percentage": 44.75, "elapsed_time": "18:53:52", "remaining_time": "23:19:55", "throughput": 333.23, "total_tokens": 22670400} {"current_steps": 17905, "total_steps": 40000, "loss": 0.0668, "lr": 0.17458154138713522, "epoch": 0.8748442576893949, "percentage": 44.76, "elapsed_time": "18:53:55", "remaining_time": "23:19:16", "throughput": 333.3, "total_tokens": 22676384} {"current_steps": 17910, "total_steps": 40000, "loss": 0.0633, "lr": 0.17452343097822576, "epoch": 0.8750885593530892, "percentage": 44.77, "elapsed_time": "18:53:58", "remaining_time": "23:18:38", "throughput": 333.38, "total_tokens": 22683040} {"current_steps": 17915, "total_steps": 40000, "loss": 0.0777, "lr": 0.17446531678749497, "epoch": 0.8753328610167835, "percentage": 44.79, "elapsed_time": "18:54:01", "remaining_time": "23:17:59", "throughput": 333.46, "total_tokens": 22689536} {"current_steps": 17920, "total_steps": 40000, "loss": 0.0467, "lr": 0.17440719882390496, "epoch": 0.8755771626804778, "percentage": 44.8, "elapsed_time": "18:54:04", "remaining_time": "23:17:21", "throughput": 333.54, "total_tokens": 22695936} {"current_steps": 17925, "total_steps": 40000, "loss": 0.0668, "lr": 0.17434907709641814, "epoch": 0.8758214643441722, "percentage": 44.81, "elapsed_time": "18:54:07", "remaining_time": "23:16:42", "throughput": 333.62, "total_tokens": 22702176} {"current_steps": 17930, "total_steps": 40000, "loss": 0.0683, "lr": 0.17429095161399769, "epoch": 0.8760657660078666, "percentage": 44.82, "elapsed_time": "18:54:11", "remaining_time": "23:16:03", "throughput": 333.7, "total_tokens": 22708608} {"current_steps": 17935, "total_steps": 40000, "loss": 0.0524, "lr": 0.1742328223856072, "epoch": 0.8763100676715608, "percentage": 44.84, "elapsed_time": "18:54:14", "remaining_time": "23:15:25", "throughput": 333.77, "total_tokens": 22714528} {"current_steps": 17940, "total_steps": 40000, "loss": 0.0713, "lr": 0.174174689420211, "epoch": 0.8765543693352552, "percentage": 44.85, "elapsed_time": "18:54:17", "remaining_time": "23:14:46", "throughput": 333.85, "total_tokens": 22720896} {"current_steps": 17945, "total_steps": 40000, "loss": 0.0468, "lr": 0.1741165527267739, "epoch": 0.8767986709989495, "percentage": 44.86, "elapsed_time": "18:54:20", "remaining_time": "23:14:08", "throughput": 333.93, "total_tokens": 22727328} {"current_steps": 17950, "total_steps": 40000, "loss": 0.0724, "lr": 0.17405841231426125, "epoch": 0.8770429726626439, "percentage": 44.88, "elapsed_time": "18:54:23", "remaining_time": "23:13:29", "throughput": 334.01, "total_tokens": 22733632} {"current_steps": 17955, "total_steps": 40000, "loss": 0.0874, "lr": 0.1740002681916391, "epoch": 0.8772872743263381, "percentage": 44.89, "elapsed_time": "18:54:26", "remaining_time": "23:12:51", "throughput": 334.09, "total_tokens": 22740128} {"current_steps": 17960, "total_steps": 40000, "loss": 0.056, "lr": 0.17394212036787401, "epoch": 0.8775315759900325, "percentage": 44.9, "elapsed_time": "18:54:29", "remaining_time": "23:12:13", "throughput": 334.16, "total_tokens": 22746176} {"current_steps": 17965, "total_steps": 40000, "loss": 0.0926, "lr": 0.1738839688519331, "epoch": 0.8777758776537268, "percentage": 44.91, "elapsed_time": "18:54:32", "remaining_time": "23:11:34", "throughput": 334.23, "total_tokens": 22752128} {"current_steps": 17970, "total_steps": 40000, "loss": 0.0551, "lr": 0.17382581365278402, "epoch": 0.8780201793174212, "percentage": 44.92, "elapsed_time": "18:54:35", "remaining_time": "23:10:56", "throughput": 334.31, "total_tokens": 22758560} {"current_steps": 17975, "total_steps": 40000, "loss": 0.0792, "lr": 0.17376765477939507, "epoch": 0.8782644809811155, "percentage": 44.94, "elapsed_time": "18:54:38", "remaining_time": "23:10:17", "throughput": 334.39, "total_tokens": 22764864} {"current_steps": 17980, "total_steps": 40000, "loss": 0.0547, "lr": 0.1737094922407351, "epoch": 0.8785087826448098, "percentage": 44.95, "elapsed_time": "18:54:41", "remaining_time": "23:09:39", "throughput": 334.47, "total_tokens": 22771264} {"current_steps": 17985, "total_steps": 40000, "loss": 0.0661, "lr": 0.1736513260457734, "epoch": 0.8787530843085042, "percentage": 44.96, "elapsed_time": "18:54:45", "remaining_time": "23:09:01", "throughput": 334.54, "total_tokens": 22777376} {"current_steps": 17990, "total_steps": 40000, "loss": 0.0652, "lr": 0.17359315620348006, "epoch": 0.8789973859721985, "percentage": 44.98, "elapsed_time": "18:54:48", "remaining_time": "23:08:22", "throughput": 334.62, "total_tokens": 22783520} {"current_steps": 17995, "total_steps": 40000, "loss": 0.0589, "lr": 0.17353498272282547, "epoch": 0.8792416876358928, "percentage": 44.99, "elapsed_time": "18:54:51", "remaining_time": "23:07:44", "throughput": 334.7, "total_tokens": 22790048} {"current_steps": 18000, "total_steps": 40000, "loss": 0.0626, "lr": 0.17347680561278087, "epoch": 0.8794859892995871, "percentage": 45.0, "elapsed_time": "18:54:54", "remaining_time": "23:07:06", "throughput": 334.78, "total_tokens": 22796480} {"current_steps": 18000, "total_steps": 40000, "eval_loss": 0.06703109294176102, "epoch": 0.8794859892995871, "percentage": 45.0, "elapsed_time": "19:05:34", "remaining_time": "23:20:09", "throughput": 331.66, "total_tokens": 22796480} {"current_steps": 18005, "total_steps": 40000, "loss": 0.0483, "lr": 0.1734186248823178, "epoch": 0.8797302909632815, "percentage": 45.01, "elapsed_time": "19:05:41", "remaining_time": "23:19:34", "throughput": 331.72, "total_tokens": 22802848} {"current_steps": 18010, "total_steps": 40000, "loss": 0.0571, "lr": 0.17336044054040844, "epoch": 0.8799745926269757, "percentage": 45.02, "elapsed_time": "19:05:44", "remaining_time": "23:18:56", "throughput": 331.79, "total_tokens": 22808992} {"current_steps": 18015, "total_steps": 40000, "loss": 0.0704, "lr": 0.1733022525960256, "epoch": 0.8802188942906701, "percentage": 45.04, "elapsed_time": "19:05:47", "remaining_time": "23:18:17", "throughput": 331.87, "total_tokens": 22815168} {"current_steps": 18020, "total_steps": 40000, "loss": 0.0711, "lr": 0.1732440610581426, "epoch": 0.8804631959543644, "percentage": 45.05, "elapsed_time": "19:05:50", "remaining_time": "23:17:39", "throughput": 331.94, "total_tokens": 22821376} {"current_steps": 18025, "total_steps": 40000, "loss": 0.0684, "lr": 0.17318586593573326, "epoch": 0.8807074976180588, "percentage": 45.06, "elapsed_time": "19:05:53", "remaining_time": "23:17:00", "throughput": 332.01, "total_tokens": 22827200} {"current_steps": 18030, "total_steps": 40000, "loss": 0.0614, "lr": 0.17312766723777204, "epoch": 0.8809517992817532, "percentage": 45.07, "elapsed_time": "19:05:56", "remaining_time": "23:16:21", "throughput": 332.1, "total_tokens": 22834048} {"current_steps": 18035, "total_steps": 40000, "loss": 0.0859, "lr": 0.1730694649732339, "epoch": 0.8811961009454474, "percentage": 45.09, "elapsed_time": "19:06:00", "remaining_time": "23:15:43", "throughput": 332.18, "total_tokens": 22840672} {"current_steps": 18040, "total_steps": 40000, "loss": 0.0414, "lr": 0.17301125915109428, "epoch": 0.8814404026091418, "percentage": 45.1, "elapsed_time": "19:06:03", "remaining_time": "23:15:05", "throughput": 332.26, "total_tokens": 22847008} {"current_steps": 18045, "total_steps": 40000, "loss": 0.075, "lr": 0.17295304978032938, "epoch": 0.8816847042728361, "percentage": 45.11, "elapsed_time": "19:06:06", "remaining_time": "23:14:26", "throughput": 332.34, "total_tokens": 22853856} {"current_steps": 18050, "total_steps": 40000, "loss": 0.0653, "lr": 0.17289483686991577, "epoch": 0.8819290059365305, "percentage": 45.12, "elapsed_time": "19:06:09", "remaining_time": "23:13:48", "throughput": 332.42, "total_tokens": 22860096} {"current_steps": 18055, "total_steps": 40000, "loss": 0.0545, "lr": 0.1728366204288306, "epoch": 0.8821733076002247, "percentage": 45.14, "elapsed_time": "19:06:12", "remaining_time": "23:13:09", "throughput": 332.51, "total_tokens": 22867456} {"current_steps": 18060, "total_steps": 40000, "loss": 0.0363, "lr": 0.17277840046605153, "epoch": 0.8824176092639191, "percentage": 45.15, "elapsed_time": "19:06:15", "remaining_time": "23:12:31", "throughput": 332.58, "total_tokens": 22873248} {"current_steps": 18065, "total_steps": 40000, "loss": 0.0415, "lr": 0.17272017699055686, "epoch": 0.8826619109276134, "percentage": 45.16, "elapsed_time": "19:06:18", "remaining_time": "23:11:53", "throughput": 332.66, "total_tokens": 22879680} {"current_steps": 18070, "total_steps": 40000, "loss": 0.0619, "lr": 0.17266195001132542, "epoch": 0.8829062125913077, "percentage": 45.17, "elapsed_time": "19:06:21", "remaining_time": "23:11:14", "throughput": 332.73, "total_tokens": 22885920} {"current_steps": 18075, "total_steps": 40000, "loss": 0.037, "lr": 0.17260371953733647, "epoch": 0.8831505142550021, "percentage": 45.19, "elapsed_time": "19:06:24", "remaining_time": "23:10:36", "throughput": 332.81, "total_tokens": 22892480} {"current_steps": 18080, "total_steps": 40000, "loss": 0.0759, "lr": 0.1725454855775699, "epoch": 0.8833948159186964, "percentage": 45.2, "elapsed_time": "19:06:27", "remaining_time": "23:09:57", "throughput": 332.88, "total_tokens": 22898208} {"current_steps": 18085, "total_steps": 40000, "loss": 0.0851, "lr": 0.17248724814100616, "epoch": 0.8836391175823908, "percentage": 45.21, "elapsed_time": "19:06:30", "remaining_time": "23:09:19", "throughput": 332.95, "total_tokens": 22904128} {"current_steps": 18090, "total_steps": 40000, "loss": 0.0641, "lr": 0.17242900723662619, "epoch": 0.883883419246085, "percentage": 45.23, "elapsed_time": "19:06:33", "remaining_time": "23:08:40", "throughput": 333.03, "total_tokens": 22910176} {"current_steps": 18095, "total_steps": 40000, "loss": 0.0896, "lr": 0.1723707628734114, "epoch": 0.8841277209097794, "percentage": 45.24, "elapsed_time": "19:06:36", "remaining_time": "23:08:02", "throughput": 333.1, "total_tokens": 22916160} {"current_steps": 18100, "total_steps": 40000, "loss": 0.0736, "lr": 0.1723125150603438, "epoch": 0.8843720225734737, "percentage": 45.25, "elapsed_time": "19:06:40", "remaining_time": "23:07:24", "throughput": 333.17, "total_tokens": 22922432} {"current_steps": 18105, "total_steps": 40000, "loss": 0.0736, "lr": 0.1722542638064061, "epoch": 0.8846163242371681, "percentage": 45.26, "elapsed_time": "19:06:43", "remaining_time": "23:06:46", "throughput": 333.25, "total_tokens": 22928864} {"current_steps": 18110, "total_steps": 40000, "loss": 0.0452, "lr": 0.17219600912058117, "epoch": 0.8848606259008623, "percentage": 45.27, "elapsed_time": "19:06:46", "remaining_time": "23:06:07", "throughput": 333.33, "total_tokens": 22934848} {"current_steps": 18115, "total_steps": 40000, "loss": 0.092, "lr": 0.17213775101185272, "epoch": 0.8851049275645567, "percentage": 45.29, "elapsed_time": "19:06:49", "remaining_time": "23:05:29", "throughput": 333.4, "total_tokens": 22940928} {"current_steps": 18120, "total_steps": 40000, "loss": 0.0514, "lr": 0.17207948948920485, "epoch": 0.885349229228251, "percentage": 45.3, "elapsed_time": "19:06:52", "remaining_time": "23:04:51", "throughput": 333.48, "total_tokens": 22947744} {"current_steps": 18125, "total_steps": 40000, "loss": 0.0521, "lr": 0.17202122456162228, "epoch": 0.8855935308919454, "percentage": 45.31, "elapsed_time": "19:06:55", "remaining_time": "23:04:13", "throughput": 333.56, "total_tokens": 22954336} {"current_steps": 18130, "total_steps": 40000, "loss": 0.0863, "lr": 0.17196295623809013, "epoch": 0.8858378325556397, "percentage": 45.32, "elapsed_time": "19:06:58", "remaining_time": "23:03:35", "throughput": 333.64, "total_tokens": 22960704} {"current_steps": 18135, "total_steps": 40000, "loss": 0.0528, "lr": 0.1719046845275941, "epoch": 0.886082134219334, "percentage": 45.34, "elapsed_time": "19:07:01", "remaining_time": "23:02:56", "throughput": 333.71, "total_tokens": 22966784} {"current_steps": 18140, "total_steps": 40000, "loss": 0.0418, "lr": 0.17184640943912044, "epoch": 0.8863264358830284, "percentage": 45.35, "elapsed_time": "19:07:04", "remaining_time": "23:02:18", "throughput": 333.79, "total_tokens": 22972960} {"current_steps": 18145, "total_steps": 40000, "loss": 0.0511, "lr": 0.1717881309816559, "epoch": 0.8865707375467227, "percentage": 45.36, "elapsed_time": "19:07:07", "remaining_time": "23:01:40", "throughput": 333.87, "total_tokens": 22979872} {"current_steps": 18150, "total_steps": 40000, "loss": 0.0411, "lr": 0.1717298491641878, "epoch": 0.886815039210417, "percentage": 45.38, "elapsed_time": "19:07:11", "remaining_time": "23:01:02", "throughput": 333.95, "total_tokens": 22986432} {"current_steps": 18155, "total_steps": 40000, "loss": 0.0497, "lr": 0.17167156399570385, "epoch": 0.8870593408741113, "percentage": 45.39, "elapsed_time": "19:07:14", "remaining_time": "23:00:24", "throughput": 334.03, "total_tokens": 22992800} {"current_steps": 18160, "total_steps": 40000, "loss": 0.0671, "lr": 0.17161327548519242, "epoch": 0.8873036425378057, "percentage": 45.4, "elapsed_time": "19:07:17", "remaining_time": "22:59:46", "throughput": 334.11, "total_tokens": 22999072} {"current_steps": 18165, "total_steps": 40000, "loss": 0.056, "lr": 0.1715549836416423, "epoch": 0.8875479442015, "percentage": 45.41, "elapsed_time": "19:07:20", "remaining_time": "22:59:08", "throughput": 334.19, "total_tokens": 23005472} {"current_steps": 18170, "total_steps": 40000, "loss": 0.056, "lr": 0.17149668847404279, "epoch": 0.8877922458651943, "percentage": 45.42, "elapsed_time": "19:07:23", "remaining_time": "22:58:30", "throughput": 334.26, "total_tokens": 23011488} {"current_steps": 18175, "total_steps": 40000, "loss": 0.1023, "lr": 0.1714383899913838, "epoch": 0.8880365475288887, "percentage": 45.44, "elapsed_time": "19:07:26", "remaining_time": "22:57:52", "throughput": 334.34, "total_tokens": 23017824} {"current_steps": 18180, "total_steps": 40000, "loss": 0.0566, "lr": 0.17138008820265563, "epoch": 0.888280849192583, "percentage": 45.45, "elapsed_time": "19:07:29", "remaining_time": "22:57:14", "throughput": 334.41, "total_tokens": 23024000} {"current_steps": 18185, "total_steps": 40000, "loss": 0.0413, "lr": 0.17132178311684917, "epoch": 0.8885251508562774, "percentage": 45.46, "elapsed_time": "19:07:32", "remaining_time": "22:56:36", "throughput": 334.49, "total_tokens": 23030592} {"current_steps": 18190, "total_steps": 40000, "loss": 0.0626, "lr": 0.1712634747429559, "epoch": 0.8887694525199716, "percentage": 45.48, "elapsed_time": "19:07:35", "remaining_time": "22:55:58", "throughput": 334.57, "total_tokens": 23036928} {"current_steps": 18195, "total_steps": 40000, "loss": 0.0692, "lr": 0.17120516308996753, "epoch": 0.889013754183666, "percentage": 45.49, "elapsed_time": "19:07:38", "remaining_time": "22:55:21", "throughput": 334.65, "total_tokens": 23043744} {"current_steps": 18200, "total_steps": 40000, "loss": 0.0883, "lr": 0.17114684816687653, "epoch": 0.8892580558473603, "percentage": 45.5, "elapsed_time": "19:07:42", "remaining_time": "22:54:43", "throughput": 334.73, "total_tokens": 23050080} {"current_steps": 18200, "total_steps": 40000, "eval_loss": 0.06575492769479752, "epoch": 0.8892580558473603, "percentage": 45.5, "elapsed_time": "19:18:22", "remaining_time": "23:07:30", "throughput": 331.64, "total_tokens": 23050080} {"current_steps": 18205, "total_steps": 40000, "loss": 0.0601, "lr": 0.17108852998267585, "epoch": 0.8895023575110547, "percentage": 45.51, "elapsed_time": "19:18:26", "remaining_time": "23:06:52", "throughput": 331.72, "total_tokens": 23056480} {"current_steps": 18210, "total_steps": 40000, "loss": 0.0719, "lr": 0.17103020854635878, "epoch": 0.8897466591747489, "percentage": 45.52, "elapsed_time": "19:18:29", "remaining_time": "23:06:14", "throughput": 331.79, "total_tokens": 23062464} {"current_steps": 18215, "total_steps": 40000, "loss": 0.0862, "lr": 0.1709718838669193, "epoch": 0.8899909608384433, "percentage": 45.54, "elapsed_time": "19:18:32", "remaining_time": "23:05:36", "throughput": 331.87, "total_tokens": 23068864} {"current_steps": 18220, "total_steps": 40000, "loss": 0.0629, "lr": 0.17091355595335173, "epoch": 0.8902352625021377, "percentage": 45.55, "elapsed_time": "19:18:35", "remaining_time": "23:04:58", "throughput": 331.94, "total_tokens": 23074688} {"current_steps": 18225, "total_steps": 40000, "loss": 0.0581, "lr": 0.17085522481465107, "epoch": 0.890479564165832, "percentage": 45.56, "elapsed_time": "19:18:38", "remaining_time": "23:04:20", "throughput": 332.02, "total_tokens": 23081408} {"current_steps": 18230, "total_steps": 40000, "loss": 0.0384, "lr": 0.17079689045981264, "epoch": 0.8907238658295263, "percentage": 45.57, "elapsed_time": "19:18:41", "remaining_time": "23:03:41", "throughput": 332.09, "total_tokens": 23087648} {"current_steps": 18235, "total_steps": 40000, "loss": 0.0581, "lr": 0.17073855289783238, "epoch": 0.8909681674932206, "percentage": 45.59, "elapsed_time": "19:18:44", "remaining_time": "23:03:03", "throughput": 332.17, "total_tokens": 23093792} {"current_steps": 18240, "total_steps": 40000, "loss": 0.0732, "lr": 0.1706802121377066, "epoch": 0.891212469156915, "percentage": 45.6, "elapsed_time": "19:18:47", "remaining_time": "23:02:25", "throughput": 332.24, "total_tokens": 23100000} {"current_steps": 18245, "total_steps": 40000, "loss": 0.0594, "lr": 0.17062186818843225, "epoch": 0.8914567708206093, "percentage": 45.61, "elapsed_time": "19:18:50", "remaining_time": "23:01:47", "throughput": 332.31, "total_tokens": 23106016} {"current_steps": 18250, "total_steps": 40000, "loss": 0.0858, "lr": 0.17056352105900668, "epoch": 0.8917010724843036, "percentage": 45.62, "elapsed_time": "19:18:53", "remaining_time": "23:01:09", "throughput": 332.39, "total_tokens": 23112096} {"current_steps": 18255, "total_steps": 40000, "loss": 0.071, "lr": 0.17050517075842772, "epoch": 0.8919453741479979, "percentage": 45.64, "elapsed_time": "19:18:57", "remaining_time": "23:00:31", "throughput": 332.47, "total_tokens": 23118688} {"current_steps": 18260, "total_steps": 40000, "loss": 0.0535, "lr": 0.17044681729569375, "epoch": 0.8921896758116923, "percentage": 45.65, "elapsed_time": "19:19:00", "remaining_time": "22:59:53", "throughput": 332.54, "total_tokens": 23125088} {"current_steps": 18265, "total_steps": 40000, "loss": 0.0826, "lr": 0.17038846067980365, "epoch": 0.8924339774753866, "percentage": 45.66, "elapsed_time": "19:19:03", "remaining_time": "22:59:15", "throughput": 332.61, "total_tokens": 23131104} {"current_steps": 18270, "total_steps": 40000, "loss": 0.0637, "lr": 0.17033010091975664, "epoch": 0.8926782791390809, "percentage": 45.67, "elapsed_time": "19:19:06", "remaining_time": "22:58:37", "throughput": 332.7, "total_tokens": 23137920} {"current_steps": 18275, "total_steps": 40000, "loss": 0.066, "lr": 0.17027173802455262, "epoch": 0.8929225808027753, "percentage": 45.69, "elapsed_time": "19:19:09", "remaining_time": "22:57:59", "throughput": 332.77, "total_tokens": 23144224} {"current_steps": 18280, "total_steps": 40000, "loss": 0.0519, "lr": 0.1702133720031918, "epoch": 0.8931668824664696, "percentage": 45.7, "elapsed_time": "19:19:12", "remaining_time": "22:57:21", "throughput": 332.85, "total_tokens": 23150592} {"current_steps": 18285, "total_steps": 40000, "loss": 0.0635, "lr": 0.17015500286467503, "epoch": 0.893411184130164, "percentage": 45.71, "elapsed_time": "19:19:15", "remaining_time": "22:56:43", "throughput": 332.93, "total_tokens": 23157088} {"current_steps": 18290, "total_steps": 40000, "loss": 0.0455, "lr": 0.17009663061800354, "epoch": 0.8936554857938582, "percentage": 45.73, "elapsed_time": "19:19:18", "remaining_time": "22:56:05", "throughput": 333.01, "total_tokens": 23164096} {"current_steps": 18295, "total_steps": 40000, "loss": 0.0566, "lr": 0.17003825527217903, "epoch": 0.8938997874575526, "percentage": 45.74, "elapsed_time": "19:19:22", "remaining_time": "22:55:27", "throughput": 333.09, "total_tokens": 23170368} {"current_steps": 18300, "total_steps": 40000, "loss": 0.0273, "lr": 0.16997987683620377, "epoch": 0.8941440891212469, "percentage": 45.75, "elapsed_time": "19:19:25", "remaining_time": "22:54:49", "throughput": 333.17, "total_tokens": 23176896} {"current_steps": 18305, "total_steps": 40000, "loss": 0.0574, "lr": 0.16992149531908043, "epoch": 0.8943883907849413, "percentage": 45.76, "elapsed_time": "19:19:28", "remaining_time": "22:54:11", "throughput": 333.24, "total_tokens": 23183040} {"current_steps": 18310, "total_steps": 40000, "loss": 0.0856, "lr": 0.16986311072981214, "epoch": 0.8946326924486355, "percentage": 45.77, "elapsed_time": "19:19:31", "remaining_time": "22:53:34", "throughput": 333.32, "total_tokens": 23189504} {"current_steps": 18315, "total_steps": 40000, "loss": 0.0644, "lr": 0.16980472307740255, "epoch": 0.8948769941123299, "percentage": 45.79, "elapsed_time": "19:19:34", "remaining_time": "22:52:56", "throughput": 333.4, "total_tokens": 23195808} {"current_steps": 18320, "total_steps": 40000, "loss": 0.0692, "lr": 0.1697463323708558, "epoch": 0.8951212957760243, "percentage": 45.8, "elapsed_time": "19:19:37", "remaining_time": "22:52:18", "throughput": 333.48, "total_tokens": 23202528} {"current_steps": 18325, "total_steps": 40000, "loss": 0.1001, "lr": 0.16968793861917641, "epoch": 0.8953655974397186, "percentage": 45.81, "elapsed_time": "19:19:40", "remaining_time": "22:51:40", "throughput": 333.55, "total_tokens": 23208416} {"current_steps": 18330, "total_steps": 40000, "loss": 0.058, "lr": 0.16962954183136952, "epoch": 0.8956098991034129, "percentage": 45.82, "elapsed_time": "19:19:43", "remaining_time": "22:51:02", "throughput": 333.63, "total_tokens": 23214976} {"current_steps": 18335, "total_steps": 40000, "loss": 0.0473, "lr": 0.16957114201644058, "epoch": 0.8958542007671072, "percentage": 45.84, "elapsed_time": "19:19:46", "remaining_time": "22:50:25", "throughput": 333.7, "total_tokens": 23221056} {"current_steps": 18340, "total_steps": 40000, "loss": 0.0768, "lr": 0.16951273918339563, "epoch": 0.8960985024308016, "percentage": 45.85, "elapsed_time": "19:19:49", "remaining_time": "22:49:47", "throughput": 333.78, "total_tokens": 23227392} {"current_steps": 18345, "total_steps": 40000, "loss": 0.0548, "lr": 0.16945433334124105, "epoch": 0.8963428040944958, "percentage": 45.86, "elapsed_time": "19:19:52", "remaining_time": "22:49:09", "throughput": 333.85, "total_tokens": 23233376} {"current_steps": 18350, "total_steps": 40000, "loss": 0.0447, "lr": 0.1693959244989838, "epoch": 0.8965871057581902, "percentage": 45.88, "elapsed_time": "19:19:55", "remaining_time": "22:48:31", "throughput": 333.92, "total_tokens": 23239520} {"current_steps": 18355, "total_steps": 40000, "loss": 0.0692, "lr": 0.16933751266563127, "epoch": 0.8968314074218845, "percentage": 45.89, "elapsed_time": "19:19:59", "remaining_time": "22:47:54", "throughput": 334.0, "total_tokens": 23246272} {"current_steps": 18360, "total_steps": 40000, "loss": 0.0677, "lr": 0.16927909785019118, "epoch": 0.8970757090855789, "percentage": 45.9, "elapsed_time": "19:20:02", "remaining_time": "22:47:16", "throughput": 334.07, "total_tokens": 23252320} {"current_steps": 18365, "total_steps": 40000, "loss": 0.0739, "lr": 0.169220680061672, "epoch": 0.8973200107492733, "percentage": 45.91, "elapsed_time": "19:20:05", "remaining_time": "22:46:38", "throughput": 334.15, "total_tokens": 23258528} {"current_steps": 18370, "total_steps": 40000, "loss": 0.0653, "lr": 0.16916225930908244, "epoch": 0.8975643124129675, "percentage": 45.92, "elapsed_time": "19:20:08", "remaining_time": "22:46:01", "throughput": 334.23, "total_tokens": 23265024} {"current_steps": 18375, "total_steps": 40000, "loss": 0.0572, "lr": 0.16910383560143163, "epoch": 0.8978086140766619, "percentage": 45.94, "elapsed_time": "19:20:11", "remaining_time": "22:45:23", "throughput": 334.31, "total_tokens": 23271520} {"current_steps": 18380, "total_steps": 40000, "loss": 0.0781, "lr": 0.16904540894772935, "epoch": 0.8980529157403562, "percentage": 45.95, "elapsed_time": "19:20:14", "remaining_time": "22:44:45", "throughput": 334.38, "total_tokens": 23277632} {"current_steps": 18385, "total_steps": 40000, "loss": 0.0589, "lr": 0.16898697935698562, "epoch": 0.8982972174040506, "percentage": 45.96, "elapsed_time": "19:20:17", "remaining_time": "22:44:08", "throughput": 334.46, "total_tokens": 23284608} {"current_steps": 18390, "total_steps": 40000, "loss": 0.0993, "lr": 0.1689285468382111, "epoch": 0.8985415190677448, "percentage": 45.98, "elapsed_time": "19:20:20", "remaining_time": "22:43:30", "throughput": 334.54, "total_tokens": 23290976} {"current_steps": 18395, "total_steps": 40000, "loss": 0.0769, "lr": 0.16887011140041677, "epoch": 0.8987858207314392, "percentage": 45.99, "elapsed_time": "19:20:23", "remaining_time": "22:42:53", "throughput": 334.62, "total_tokens": 23297728} {"current_steps": 18400, "total_steps": 40000, "loss": 0.0479, "lr": 0.1688116730526141, "epoch": 0.8990301223951335, "percentage": 46.0, "elapsed_time": "19:20:26", "remaining_time": "22:42:16", "throughput": 334.7, "total_tokens": 23304192} {"current_steps": 18400, "total_steps": 40000, "eval_loss": 0.06781475991010666, "epoch": 0.8990301223951335, "percentage": 46.0, "elapsed_time": "19:31:07", "remaining_time": "22:54:47", "throughput": 331.65, "total_tokens": 23304192} {"current_steps": 18405, "total_steps": 40000, "loss": 0.0875, "lr": 0.1687532318038151, "epoch": 0.8992744240588278, "percentage": 46.01, "elapsed_time": "19:31:10", "remaining_time": "22:54:10", "throughput": 331.73, "total_tokens": 23310688} {"current_steps": 18410, "total_steps": 40000, "loss": 0.0773, "lr": 0.16869478766303206, "epoch": 0.8995187257225221, "percentage": 46.02, "elapsed_time": "19:31:13", "remaining_time": "22:53:32", "throughput": 331.8, "total_tokens": 23317120} {"current_steps": 18415, "total_steps": 40000, "loss": 0.0567, "lr": 0.16863634063927788, "epoch": 0.8997630273862165, "percentage": 46.04, "elapsed_time": "19:31:17", "remaining_time": "22:52:54", "throughput": 331.88, "total_tokens": 23323392} {"current_steps": 18420, "total_steps": 40000, "loss": 0.0649, "lr": 0.16857789074156568, "epoch": 0.9000073290499109, "percentage": 46.05, "elapsed_time": "19:31:20", "remaining_time": "22:52:16", "throughput": 331.95, "total_tokens": 23329600} {"current_steps": 18425, "total_steps": 40000, "loss": 0.0577, "lr": 0.16851943797890928, "epoch": 0.9002516307136051, "percentage": 46.06, "elapsed_time": "19:31:23", "remaining_time": "22:51:39", "throughput": 332.03, "total_tokens": 23336096} {"current_steps": 18430, "total_steps": 40000, "loss": 0.058, "lr": 0.16846098236032284, "epoch": 0.9004959323772995, "percentage": 46.08, "elapsed_time": "19:31:26", "remaining_time": "22:51:01", "throughput": 332.1, "total_tokens": 23342336} {"current_steps": 18435, "total_steps": 40000, "loss": 0.0713, "lr": 0.16840252389482097, "epoch": 0.9007402340409938, "percentage": 46.09, "elapsed_time": "19:31:29", "remaining_time": "22:50:23", "throughput": 332.18, "total_tokens": 23348608} {"current_steps": 18440, "total_steps": 40000, "loss": 0.0641, "lr": 0.16834406259141857, "epoch": 0.9009845357046882, "percentage": 46.1, "elapsed_time": "19:31:32", "remaining_time": "22:49:45", "throughput": 332.25, "total_tokens": 23355008} {"current_steps": 18445, "total_steps": 40000, "loss": 0.0474, "lr": 0.16828559845913124, "epoch": 0.9012288373683824, "percentage": 46.11, "elapsed_time": "19:31:35", "remaining_time": "22:49:08", "throughput": 332.33, "total_tokens": 23361632} {"current_steps": 18450, "total_steps": 40000, "loss": 0.0592, "lr": 0.16822713150697488, "epoch": 0.9014731390320768, "percentage": 46.12, "elapsed_time": "19:31:38", "remaining_time": "22:48:30", "throughput": 332.41, "total_tokens": 23368224} {"current_steps": 18455, "total_steps": 40000, "loss": 0.0518, "lr": 0.16816866174396575, "epoch": 0.9017174406957711, "percentage": 46.14, "elapsed_time": "19:31:41", "remaining_time": "22:47:52", "throughput": 332.49, "total_tokens": 23374720} {"current_steps": 18460, "total_steps": 40000, "loss": 0.0947, "lr": 0.16811018917912057, "epoch": 0.9019617423594655, "percentage": 46.15, "elapsed_time": "19:31:45", "remaining_time": "22:47:15", "throughput": 332.57, "total_tokens": 23381152} {"current_steps": 18465, "total_steps": 40000, "loss": 0.041, "lr": 0.16805171382145673, "epoch": 0.9022060440231598, "percentage": 46.16, "elapsed_time": "19:31:48", "remaining_time": "22:46:37", "throughput": 332.64, "total_tokens": 23387584} {"current_steps": 18470, "total_steps": 40000, "loss": 0.0989, "lr": 0.16799323567999175, "epoch": 0.9024503456868541, "percentage": 46.17, "elapsed_time": "19:31:51", "remaining_time": "22:45:59", "throughput": 332.71, "total_tokens": 23393376} {"current_steps": 18475, "total_steps": 40000, "loss": 0.0776, "lr": 0.16793475476374367, "epoch": 0.9026946473505485, "percentage": 46.19, "elapsed_time": "19:31:54", "remaining_time": "22:45:22", "throughput": 332.79, "total_tokens": 23400064} {"current_steps": 18480, "total_steps": 40000, "loss": 0.0755, "lr": 0.1678762710817311, "epoch": 0.9029389490142428, "percentage": 46.2, "elapsed_time": "19:31:57", "remaining_time": "22:44:44", "throughput": 332.86, "total_tokens": 23406176} {"current_steps": 18485, "total_steps": 40000, "loss": 0.082, "lr": 0.1678177846429728, "epoch": 0.9031832506779371, "percentage": 46.21, "elapsed_time": "19:32:00", "remaining_time": "22:44:07", "throughput": 332.94, "total_tokens": 23412768} {"current_steps": 18490, "total_steps": 40000, "loss": 0.0684, "lr": 0.16775929545648827, "epoch": 0.9034275523416314, "percentage": 46.23, "elapsed_time": "19:32:03", "remaining_time": "22:43:29", "throughput": 333.02, "total_tokens": 23418976} {"current_steps": 18495, "total_steps": 40000, "loss": 0.0568, "lr": 0.16770080353129715, "epoch": 0.9036718540053258, "percentage": 46.24, "elapsed_time": "19:32:06", "remaining_time": "22:42:52", "throughput": 333.09, "total_tokens": 23425120} {"current_steps": 18500, "total_steps": 40000, "loss": 0.0636, "lr": 0.16764230887641968, "epoch": 0.9039161556690201, "percentage": 46.25, "elapsed_time": "19:32:09", "remaining_time": "22:42:14", "throughput": 333.16, "total_tokens": 23431328} {"current_steps": 18505, "total_steps": 40000, "loss": 0.0496, "lr": 0.1675838115008765, "epoch": 0.9041604573327144, "percentage": 46.26, "elapsed_time": "19:32:12", "remaining_time": "22:41:36", "throughput": 333.24, "total_tokens": 23437376} {"current_steps": 18510, "total_steps": 40000, "loss": 0.0748, "lr": 0.1675253114136886, "epoch": 0.9044047589964088, "percentage": 46.27, "elapsed_time": "19:32:15", "remaining_time": "22:40:59", "throughput": 333.31, "total_tokens": 23443648} {"current_steps": 18515, "total_steps": 40000, "loss": 0.0982, "lr": 0.16746680862387747, "epoch": 0.9046490606601031, "percentage": 46.29, "elapsed_time": "19:32:18", "remaining_time": "22:40:21", "throughput": 333.38, "total_tokens": 23449536} {"current_steps": 18520, "total_steps": 40000, "loss": 0.0878, "lr": 0.16740830314046493, "epoch": 0.9048933623237975, "percentage": 46.3, "elapsed_time": "19:32:21", "remaining_time": "22:39:44", "throughput": 333.45, "total_tokens": 23455840} {"current_steps": 18525, "total_steps": 40000, "loss": 0.074, "lr": 0.1673497949724733, "epoch": 0.9051376639874917, "percentage": 46.31, "elapsed_time": "19:32:25", "remaining_time": "22:39:07", "throughput": 333.54, "total_tokens": 23462560} {"current_steps": 18530, "total_steps": 40000, "loss": 0.0679, "lr": 0.16729128412892522, "epoch": 0.9053819656511861, "percentage": 46.33, "elapsed_time": "19:32:28", "remaining_time": "22:38:29", "throughput": 333.62, "total_tokens": 23469376} {"current_steps": 18535, "total_steps": 40000, "loss": 0.0591, "lr": 0.16723277061884384, "epoch": 0.9056262673148804, "percentage": 46.34, "elapsed_time": "19:32:31", "remaining_time": "22:37:52", "throughput": 333.7, "total_tokens": 23476096} {"current_steps": 18540, "total_steps": 40000, "loss": 0.048, "lr": 0.16717425445125267, "epoch": 0.9058705689785748, "percentage": 46.35, "elapsed_time": "19:32:34", "remaining_time": "22:37:15", "throughput": 333.78, "total_tokens": 23482592} {"current_steps": 18545, "total_steps": 40000, "loss": 0.0638, "lr": 0.16711573563517565, "epoch": 0.906114870642269, "percentage": 46.36, "elapsed_time": "19:32:37", "remaining_time": "22:36:37", "throughput": 333.85, "total_tokens": 23488704} {"current_steps": 18550, "total_steps": 40000, "loss": 0.0479, "lr": 0.1670572141796371, "epoch": 0.9063591723059634, "percentage": 46.38, "elapsed_time": "19:32:40", "remaining_time": "22:36:00", "throughput": 333.92, "total_tokens": 23495008} {"current_steps": 18555, "total_steps": 40000, "loss": 0.0689, "lr": 0.16699869009366175, "epoch": 0.9066034739696577, "percentage": 46.39, "elapsed_time": "19:32:43", "remaining_time": "22:35:23", "throughput": 334.0, "total_tokens": 23501152} {"current_steps": 18560, "total_steps": 40000, "loss": 0.0832, "lr": 0.1669401633862748, "epoch": 0.9068477756333521, "percentage": 46.4, "elapsed_time": "19:32:46", "remaining_time": "22:34:45", "throughput": 334.07, "total_tokens": 23507328} {"current_steps": 18565, "total_steps": 40000, "loss": 0.0703, "lr": 0.16688163406650178, "epoch": 0.9070920772970464, "percentage": 46.41, "elapsed_time": "19:32:49", "remaining_time": "22:34:08", "throughput": 334.14, "total_tokens": 23513472} {"current_steps": 18570, "total_steps": 40000, "loss": 0.0422, "lr": 0.1668231021433686, "epoch": 0.9073363789607407, "percentage": 46.42, "elapsed_time": "19:32:52", "remaining_time": "22:33:31", "throughput": 334.22, "total_tokens": 23520160} {"current_steps": 18575, "total_steps": 40000, "loss": 0.0415, "lr": 0.1667645676259017, "epoch": 0.9075806806244351, "percentage": 46.44, "elapsed_time": "19:32:56", "remaining_time": "22:32:53", "throughput": 334.3, "total_tokens": 23526496} {"current_steps": 18580, "total_steps": 40000, "loss": 0.0712, "lr": 0.1667060305231277, "epoch": 0.9078249822881294, "percentage": 46.45, "elapsed_time": "19:32:58", "remaining_time": "22:32:16", "throughput": 334.37, "total_tokens": 23532352} {"current_steps": 18585, "total_steps": 40000, "loss": 0.0587, "lr": 0.16664749084407396, "epoch": 0.9080692839518237, "percentage": 46.46, "elapsed_time": "19:33:02", "remaining_time": "22:31:39", "throughput": 334.44, "total_tokens": 23538592} {"current_steps": 18590, "total_steps": 40000, "loss": 0.08, "lr": 0.16658894859776788, "epoch": 0.908313585615518, "percentage": 46.48, "elapsed_time": "19:33:05", "remaining_time": "22:31:02", "throughput": 334.51, "total_tokens": 23544704} {"current_steps": 18595, "total_steps": 40000, "loss": 0.0652, "lr": 0.16653040379323752, "epoch": 0.9085578872792124, "percentage": 46.49, "elapsed_time": "19:33:08", "remaining_time": "22:30:24", "throughput": 334.58, "total_tokens": 23550688} {"current_steps": 18600, "total_steps": 40000, "loss": 0.047, "lr": 0.16647185643951107, "epoch": 0.9088021889429067, "percentage": 46.5, "elapsed_time": "19:33:11", "remaining_time": "22:29:47", "throughput": 334.66, "total_tokens": 23557152} {"current_steps": 18600, "total_steps": 40000, "eval_loss": 0.06748455762863159, "epoch": 0.9088021889429067, "percentage": 46.5, "elapsed_time": "19:43:51", "remaining_time": "22:42:04", "throughput": 331.64, "total_tokens": 23557152} {"current_steps": 18605, "total_steps": 40000, "loss": 0.0713, "lr": 0.1664133065456174, "epoch": 0.909046490606601, "percentage": 46.51, "elapsed_time": "19:43:55", "remaining_time": "22:41:27", "throughput": 331.71, "total_tokens": 23563424} {"current_steps": 18610, "total_steps": 40000, "loss": 0.0414, "lr": 0.1663547541205856, "epoch": 0.9092907922702954, "percentage": 46.52, "elapsed_time": "19:43:58", "remaining_time": "22:40:50", "throughput": 331.78, "total_tokens": 23569312} {"current_steps": 18615, "total_steps": 40000, "loss": 0.0579, "lr": 0.16629619917344518, "epoch": 0.9095350939339897, "percentage": 46.54, "elapsed_time": "19:44:01", "remaining_time": "22:40:12", "throughput": 331.86, "total_tokens": 23575776} {"current_steps": 18620, "total_steps": 40000, "loss": 0.1095, "lr": 0.16623764171322605, "epoch": 0.9097793955976841, "percentage": 46.55, "elapsed_time": "19:44:04", "remaining_time": "22:39:35", "throughput": 331.94, "total_tokens": 23582368} {"current_steps": 18625, "total_steps": 40000, "loss": 0.0326, "lr": 0.1661790817489585, "epoch": 0.9100236972613783, "percentage": 46.56, "elapsed_time": "19:44:07", "remaining_time": "22:38:57", "throughput": 332.01, "total_tokens": 23588672} {"current_steps": 18630, "total_steps": 40000, "loss": 0.0848, "lr": 0.16612051928967328, "epoch": 0.9102679989250727, "percentage": 46.58, "elapsed_time": "19:44:10", "remaining_time": "22:38:20", "throughput": 332.08, "total_tokens": 23594688} {"current_steps": 18635, "total_steps": 40000, "loss": 0.0484, "lr": 0.16606195434440138, "epoch": 0.910512300588767, "percentage": 46.59, "elapsed_time": "19:44:13", "remaining_time": "22:37:43", "throughput": 332.17, "total_tokens": 23601696} {"current_steps": 18640, "total_steps": 40000, "loss": 0.0637, "lr": 0.16600338692217426, "epoch": 0.9107566022524614, "percentage": 46.6, "elapsed_time": "19:44:16", "remaining_time": "22:37:05", "throughput": 332.24, "total_tokens": 23607904} {"current_steps": 18645, "total_steps": 40000, "loss": 0.0794, "lr": 0.16594481703202374, "epoch": 0.9110009039161556, "percentage": 46.61, "elapsed_time": "19:44:20", "remaining_time": "22:36:28", "throughput": 332.32, "total_tokens": 23614592} {"current_steps": 18650, "total_steps": 40000, "loss": 0.0694, "lr": 0.1658862446829821, "epoch": 0.91124520557985, "percentage": 46.62, "elapsed_time": "19:44:23", "remaining_time": "22:35:51", "throughput": 332.39, "total_tokens": 23620960} {"current_steps": 18655, "total_steps": 40000, "loss": 0.0667, "lr": 0.16582766988408187, "epoch": 0.9114895072435444, "percentage": 46.64, "elapsed_time": "19:44:26", "remaining_time": "22:35:13", "throughput": 332.47, "total_tokens": 23627072} {"current_steps": 18660, "total_steps": 40000, "loss": 0.0766, "lr": 0.16576909264435608, "epoch": 0.9117338089072387, "percentage": 46.65, "elapsed_time": "19:44:29", "remaining_time": "22:34:36", "throughput": 332.54, "total_tokens": 23633504} {"current_steps": 18665, "total_steps": 40000, "loss": 0.0767, "lr": 0.16571051297283798, "epoch": 0.911978110570933, "percentage": 46.66, "elapsed_time": "19:44:32", "remaining_time": "22:33:59", "throughput": 332.62, "total_tokens": 23639904} {"current_steps": 18670, "total_steps": 40000, "loss": 0.089, "lr": 0.16565193087856137, "epoch": 0.9122224122346273, "percentage": 46.67, "elapsed_time": "19:44:35", "remaining_time": "22:33:22", "throughput": 332.69, "total_tokens": 23646336} {"current_steps": 18675, "total_steps": 40000, "loss": 0.0606, "lr": 0.16559334637056033, "epoch": 0.9124667138983217, "percentage": 46.69, "elapsed_time": "19:44:38", "remaining_time": "22:32:44", "throughput": 332.76, "total_tokens": 23652320} {"current_steps": 18680, "total_steps": 40000, "loss": 0.0715, "lr": 0.16553475945786933, "epoch": 0.912711015562016, "percentage": 46.7, "elapsed_time": "19:44:41", "remaining_time": "22:32:07", "throughput": 332.84, "total_tokens": 23658464} {"current_steps": 18685, "total_steps": 40000, "loss": 0.0733, "lr": 0.16547617014952318, "epoch": 0.9129553172257103, "percentage": 46.71, "elapsed_time": "19:44:44", "remaining_time": "22:31:30", "throughput": 332.91, "total_tokens": 23664448} {"current_steps": 18690, "total_steps": 40000, "loss": 0.1014, "lr": 0.1654175784545571, "epoch": 0.9131996188894046, "percentage": 46.73, "elapsed_time": "19:44:47", "remaining_time": "22:30:52", "throughput": 332.97, "total_tokens": 23670112} {"current_steps": 18695, "total_steps": 40000, "loss": 0.0646, "lr": 0.1653589843820067, "epoch": 0.913443920553099, "percentage": 46.74, "elapsed_time": "19:44:50", "remaining_time": "22:30:15", "throughput": 333.04, "total_tokens": 23676352} {"current_steps": 18700, "total_steps": 40000, "loss": 0.0717, "lr": 0.1653003879409079, "epoch": 0.9136882222167932, "percentage": 46.75, "elapsed_time": "19:44:53", "remaining_time": "22:29:38", "throughput": 333.12, "total_tokens": 23682688} {"current_steps": 18705, "total_steps": 40000, "loss": 0.0587, "lr": 0.165241789140297, "epoch": 0.9139325238804876, "percentage": 46.76, "elapsed_time": "19:44:56", "remaining_time": "22:29:01", "throughput": 333.19, "total_tokens": 23688736} {"current_steps": 18710, "total_steps": 40000, "loss": 0.0538, "lr": 0.16518318798921064, "epoch": 0.914176825544182, "percentage": 46.77, "elapsed_time": "19:44:59", "remaining_time": "22:28:23", "throughput": 333.26, "total_tokens": 23694816} {"current_steps": 18715, "total_steps": 40000, "loss": 0.0659, "lr": 0.16512458449668593, "epoch": 0.9144211272078763, "percentage": 46.79, "elapsed_time": "19:45:02", "remaining_time": "22:27:46", "throughput": 333.33, "total_tokens": 23700800} {"current_steps": 18720, "total_steps": 40000, "loss": 0.0557, "lr": 0.1650659786717602, "epoch": 0.9146654288715707, "percentage": 46.8, "elapsed_time": "19:45:05", "remaining_time": "22:27:09", "throughput": 333.41, "total_tokens": 23707584} {"current_steps": 18725, "total_steps": 40000, "loss": 0.0838, "lr": 0.1650073705234712, "epoch": 0.9149097305352649, "percentage": 46.81, "elapsed_time": "19:45:09", "remaining_time": "22:26:32", "throughput": 333.49, "total_tokens": 23714240} {"current_steps": 18730, "total_steps": 40000, "loss": 0.0551, "lr": 0.16494876006085712, "epoch": 0.9151540321989593, "percentage": 46.83, "elapsed_time": "19:45:12", "remaining_time": "22:25:55", "throughput": 333.56, "total_tokens": 23720384} {"current_steps": 18735, "total_steps": 40000, "loss": 0.0434, "lr": 0.16489014729295634, "epoch": 0.9153983338626536, "percentage": 46.84, "elapsed_time": "19:45:15", "remaining_time": "22:25:18", "throughput": 333.64, "total_tokens": 23727008} {"current_steps": 18740, "total_steps": 40000, "loss": 0.0666, "lr": 0.16483153222880775, "epoch": 0.915642635526348, "percentage": 46.85, "elapsed_time": "19:45:18", "remaining_time": "22:24:41", "throughput": 333.72, "total_tokens": 23733696} {"current_steps": 18745, "total_steps": 40000, "loss": 0.0667, "lr": 0.16477291487745052, "epoch": 0.9158869371900422, "percentage": 46.86, "elapsed_time": "19:45:21", "remaining_time": "22:24:04", "throughput": 333.79, "total_tokens": 23739872} {"current_steps": 18750, "total_steps": 40000, "loss": 0.0514, "lr": 0.16471429524792416, "epoch": 0.9161312388537366, "percentage": 46.88, "elapsed_time": "19:45:24", "remaining_time": "22:23:27", "throughput": 333.86, "total_tokens": 23745952} {"current_steps": 18755, "total_steps": 40000, "loss": 0.0635, "lr": 0.16465567334926856, "epoch": 0.916375540517431, "percentage": 46.89, "elapsed_time": "19:45:27", "remaining_time": "22:22:50", "throughput": 333.94, "total_tokens": 23752096} {"current_steps": 18760, "total_steps": 40000, "loss": 0.0642, "lr": 0.16459704919052395, "epoch": 0.9166198421811252, "percentage": 46.9, "elapsed_time": "19:45:30", "remaining_time": "22:22:13", "throughput": 334.01, "total_tokens": 23758336} {"current_steps": 18765, "total_steps": 40000, "loss": 0.0389, "lr": 0.16453842278073086, "epoch": 0.9168641438448196, "percentage": 46.91, "elapsed_time": "19:45:33", "remaining_time": "22:21:36", "throughput": 334.1, "total_tokens": 23765472} {"current_steps": 18770, "total_steps": 40000, "loss": 0.053, "lr": 0.16447979412893038, "epoch": 0.9171084455085139, "percentage": 46.92, "elapsed_time": "19:45:36", "remaining_time": "22:21:00", "throughput": 334.17, "total_tokens": 23771840} {"current_steps": 18775, "total_steps": 40000, "loss": 0.0652, "lr": 0.16442116324416367, "epoch": 0.9173527471722083, "percentage": 46.94, "elapsed_time": "19:45:39", "remaining_time": "22:20:23", "throughput": 334.25, "total_tokens": 23778304} {"current_steps": 18780, "total_steps": 40000, "loss": 0.0778, "lr": 0.1643625301354723, "epoch": 0.9175970488359025, "percentage": 46.95, "elapsed_time": "19:45:43", "remaining_time": "22:19:46", "throughput": 334.32, "total_tokens": 23784704} {"current_steps": 18785, "total_steps": 40000, "loss": 0.0631, "lr": 0.16430389481189828, "epoch": 0.9178413504995969, "percentage": 46.96, "elapsed_time": "19:45:46", "remaining_time": "22:19:09", "throughput": 334.39, "total_tokens": 23790560} {"current_steps": 18790, "total_steps": 40000, "loss": 0.0656, "lr": 0.164245257282484, "epoch": 0.9180856521632912, "percentage": 46.98, "elapsed_time": "19:45:49", "remaining_time": "22:18:32", "throughput": 334.46, "total_tokens": 23796640} {"current_steps": 18795, "total_steps": 40000, "loss": 0.0359, "lr": 0.16418661755627195, "epoch": 0.9183299538269856, "percentage": 46.99, "elapsed_time": "19:45:52", "remaining_time": "22:17:55", "throughput": 334.53, "total_tokens": 23802752} {"current_steps": 18800, "total_steps": 40000, "loss": 0.0844, "lr": 0.16412797564230527, "epoch": 0.9185742554906798, "percentage": 47.0, "elapsed_time": "19:45:55", "remaining_time": "22:17:18", "throughput": 334.61, "total_tokens": 23808960} {"current_steps": 18800, "total_steps": 40000, "eval_loss": 0.06541521847248077, "epoch": 0.9185742554906798, "percentage": 47.0, "elapsed_time": "19:56:35", "remaining_time": "22:29:20", "throughput": 331.62, "total_tokens": 23808960} {"current_steps": 18805, "total_steps": 40000, "loss": 0.0486, "lr": 0.16406933154962713, "epoch": 0.9188185571543742, "percentage": 47.01, "elapsed_time": "19:56:39", "remaining_time": "22:28:44", "throughput": 331.69, "total_tokens": 23815328} {"current_steps": 18810, "total_steps": 40000, "loss": 0.0497, "lr": 0.16401068528728133, "epoch": 0.9190628588180686, "percentage": 47.02, "elapsed_time": "19:56:42", "remaining_time": "22:28:07", "throughput": 331.77, "total_tokens": 23821632} {"current_steps": 18815, "total_steps": 40000, "loss": 0.0778, "lr": 0.16395203686431173, "epoch": 0.9193071604817629, "percentage": 47.04, "elapsed_time": "19:56:45", "remaining_time": "22:27:30", "throughput": 331.84, "total_tokens": 23827936} {"current_steps": 18820, "total_steps": 40000, "loss": 0.0766, "lr": 0.16389338628976277, "epoch": 0.9195514621454572, "percentage": 47.05, "elapsed_time": "19:56:48", "remaining_time": "22:26:53", "throughput": 331.91, "total_tokens": 23834144} {"current_steps": 18825, "total_steps": 40000, "loss": 0.0773, "lr": 0.163834733572679, "epoch": 0.9197957638091515, "percentage": 47.06, "elapsed_time": "19:56:51", "remaining_time": "22:26:16", "throughput": 331.99, "total_tokens": 23840384} {"current_steps": 18830, "total_steps": 40000, "loss": 0.0896, "lr": 0.16377607872210545, "epoch": 0.9200400654728459, "percentage": 47.08, "elapsed_time": "19:56:54", "remaining_time": "22:25:39", "throughput": 332.06, "total_tokens": 23846976} {"current_steps": 18835, "total_steps": 40000, "loss": 0.0615, "lr": 0.16371742174708748, "epoch": 0.9202843671365402, "percentage": 47.09, "elapsed_time": "19:56:57", "remaining_time": "22:25:01", "throughput": 332.13, "total_tokens": 23852960} {"current_steps": 18840, "total_steps": 40000, "loss": 0.0666, "lr": 0.16365876265667065, "epoch": 0.9205286688002345, "percentage": 47.1, "elapsed_time": "19:57:00", "remaining_time": "22:24:24", "throughput": 332.2, "total_tokens": 23859008} {"current_steps": 18845, "total_steps": 40000, "loss": 0.0455, "lr": 0.163600101459901, "epoch": 0.9207729704639288, "percentage": 47.11, "elapsed_time": "19:57:03", "remaining_time": "22:23:47", "throughput": 332.28, "total_tokens": 23865792} {"current_steps": 18850, "total_steps": 40000, "loss": 0.0434, "lr": 0.16354143816582484, "epoch": 0.9210172721276232, "percentage": 47.12, "elapsed_time": "19:57:07", "remaining_time": "22:23:11", "throughput": 332.36, "total_tokens": 23872512} {"current_steps": 18855, "total_steps": 40000, "loss": 0.0762, "lr": 0.1634827727834887, "epoch": 0.9212615737913176, "percentage": 47.14, "elapsed_time": "19:57:10", "remaining_time": "22:22:34", "throughput": 332.44, "total_tokens": 23878912} {"current_steps": 18860, "total_steps": 40000, "loss": 0.0489, "lr": 0.16342410532193954, "epoch": 0.9215058754550118, "percentage": 47.15, "elapsed_time": "19:57:13", "remaining_time": "22:21:57", "throughput": 332.51, "total_tokens": 23885248} {"current_steps": 18865, "total_steps": 40000, "loss": 0.0956, "lr": 0.16336543579022464, "epoch": 0.9217501771187062, "percentage": 47.16, "elapsed_time": "19:57:16", "remaining_time": "22:21:20", "throughput": 332.59, "total_tokens": 23892160} {"current_steps": 18870, "total_steps": 40000, "loss": 0.0634, "lr": 0.16330676419739157, "epoch": 0.9219944787824005, "percentage": 47.17, "elapsed_time": "19:57:19", "remaining_time": "22:20:43", "throughput": 332.66, "total_tokens": 23898272} {"current_steps": 18875, "total_steps": 40000, "loss": 0.0935, "lr": 0.1632480905524883, "epoch": 0.9222387804460949, "percentage": 47.19, "elapsed_time": "19:57:22", "remaining_time": "22:20:06", "throughput": 332.74, "total_tokens": 23904576} {"current_steps": 18880, "total_steps": 40000, "loss": 0.0567, "lr": 0.16318941486456293, "epoch": 0.9224830821097891, "percentage": 47.2, "elapsed_time": "19:57:25", "remaining_time": "22:19:29", "throughput": 332.81, "total_tokens": 23911296} {"current_steps": 18885, "total_steps": 40000, "loss": 0.0934, "lr": 0.16313073714266405, "epoch": 0.9227273837734835, "percentage": 47.21, "elapsed_time": "19:57:28", "remaining_time": "22:18:53", "throughput": 332.88, "total_tokens": 23917216} {"current_steps": 18890, "total_steps": 40000, "loss": 0.05, "lr": 0.16307205739584052, "epoch": 0.9229716854371778, "percentage": 47.23, "elapsed_time": "19:57:32", "remaining_time": "22:18:16", "throughput": 332.96, "total_tokens": 23923680} {"current_steps": 18895, "total_steps": 40000, "loss": 0.047, "lr": 0.16301337563314144, "epoch": 0.9232159871008722, "percentage": 47.24, "elapsed_time": "19:57:35", "remaining_time": "22:17:39", "throughput": 333.03, "total_tokens": 23930272} {"current_steps": 18900, "total_steps": 40000, "loss": 0.0724, "lr": 0.1629546918636163, "epoch": 0.9234602887645665, "percentage": 47.25, "elapsed_time": "19:57:38", "remaining_time": "22:17:02", "throughput": 333.11, "total_tokens": 23936640} {"current_steps": 18905, "total_steps": 40000, "loss": 0.0492, "lr": 0.16289600609631485, "epoch": 0.9237045904282608, "percentage": 47.26, "elapsed_time": "19:57:41", "remaining_time": "22:16:25", "throughput": 333.19, "total_tokens": 23943168} {"current_steps": 18910, "total_steps": 40000, "loss": 0.0614, "lr": 0.16283731834028722, "epoch": 0.9239488920919552, "percentage": 47.27, "elapsed_time": "19:57:44", "remaining_time": "22:15:49", "throughput": 333.26, "total_tokens": 23949792} {"current_steps": 18915, "total_steps": 40000, "loss": 0.0644, "lr": 0.16277862860458378, "epoch": 0.9241931937556495, "percentage": 47.29, "elapsed_time": "19:57:47", "remaining_time": "22:15:12", "throughput": 333.34, "total_tokens": 23956128} {"current_steps": 18920, "total_steps": 40000, "loss": 0.0522, "lr": 0.16271993689825526, "epoch": 0.9244374954193438, "percentage": 47.3, "elapsed_time": "19:57:50", "remaining_time": "22:14:35", "throughput": 333.41, "total_tokens": 23962240} {"current_steps": 18925, "total_steps": 40000, "loss": 0.0523, "lr": 0.1626612432303526, "epoch": 0.9246817970830381, "percentage": 47.31, "elapsed_time": "19:57:53", "remaining_time": "22:13:59", "throughput": 333.48, "total_tokens": 23968672} {"current_steps": 18930, "total_steps": 40000, "loss": 0.0889, "lr": 0.1626025476099271, "epoch": 0.9249260987467325, "percentage": 47.33, "elapsed_time": "19:57:56", "remaining_time": "22:13:22", "throughput": 333.55, "total_tokens": 23974560} {"current_steps": 18935, "total_steps": 40000, "loss": 0.0831, "lr": 0.1625438500460304, "epoch": 0.9251704004104268, "percentage": 47.34, "elapsed_time": "19:57:59", "remaining_time": "22:12:45", "throughput": 333.63, "total_tokens": 23981184} {"current_steps": 18940, "total_steps": 40000, "loss": 0.0598, "lr": 0.16248515054771442, "epoch": 0.9254147020741211, "percentage": 47.35, "elapsed_time": "19:58:03", "remaining_time": "22:12:09", "throughput": 333.7, "total_tokens": 23987360} {"current_steps": 18945, "total_steps": 40000, "loss": 0.0809, "lr": 0.16242644912403123, "epoch": 0.9256590037378154, "percentage": 47.36, "elapsed_time": "19:58:06", "remaining_time": "22:11:32", "throughput": 333.77, "total_tokens": 23993472} {"current_steps": 18950, "total_steps": 40000, "loss": 0.0688, "lr": 0.1623677457840335, "epoch": 0.9259033054015098, "percentage": 47.38, "elapsed_time": "19:58:09", "remaining_time": "22:10:55", "throughput": 333.85, "total_tokens": 23999872} {"current_steps": 18955, "total_steps": 40000, "loss": 0.0504, "lr": 0.16230904053677397, "epoch": 0.9261476070652042, "percentage": 47.39, "elapsed_time": "19:58:12", "remaining_time": "22:10:19", "throughput": 333.92, "total_tokens": 24006112} {"current_steps": 18960, "total_steps": 40000, "loss": 0.0946, "lr": 0.16225033339130568, "epoch": 0.9263919087288984, "percentage": 47.4, "elapsed_time": "19:58:15", "remaining_time": "22:09:42", "throughput": 333.99, "total_tokens": 24012320} {"current_steps": 18965, "total_steps": 40000, "loss": 0.0624, "lr": 0.16219162435668197, "epoch": 0.9266362103925928, "percentage": 47.41, "elapsed_time": "19:58:18", "remaining_time": "22:09:05", "throughput": 334.06, "total_tokens": 24018496} {"current_steps": 18970, "total_steps": 40000, "loss": 0.0701, "lr": 0.16213291344195666, "epoch": 0.9268805120562871, "percentage": 47.42, "elapsed_time": "19:58:21", "remaining_time": "22:08:29", "throughput": 334.14, "total_tokens": 24024864} {"current_steps": 18975, "total_steps": 40000, "loss": 0.069, "lr": 0.16207420065618358, "epoch": 0.9271248137199815, "percentage": 47.44, "elapsed_time": "19:58:24", "remaining_time": "22:07:52", "throughput": 334.21, "total_tokens": 24031296} {"current_steps": 18980, "total_steps": 40000, "loss": 0.096, "lr": 0.16201548600841706, "epoch": 0.9273691153836757, "percentage": 47.45, "elapsed_time": "19:58:27", "remaining_time": "22:07:16", "throughput": 334.29, "total_tokens": 24038112} {"current_steps": 18985, "total_steps": 40000, "loss": 0.0784, "lr": 0.16195676950771154, "epoch": 0.9276134170473701, "percentage": 47.46, "elapsed_time": "19:58:30", "remaining_time": "22:06:40", "throughput": 334.37, "total_tokens": 24045024} {"current_steps": 18990, "total_steps": 40000, "loss": 0.0543, "lr": 0.16189805116312198, "epoch": 0.9278577187110644, "percentage": 47.48, "elapsed_time": "19:58:33", "remaining_time": "22:06:03", "throughput": 334.44, "total_tokens": 24051200} {"current_steps": 18995, "total_steps": 40000, "loss": 0.0673, "lr": 0.16183933098370337, "epoch": 0.9281020203747588, "percentage": 47.49, "elapsed_time": "19:58:37", "remaining_time": "22:05:27", "throughput": 334.52, "total_tokens": 24057632} {"current_steps": 19000, "total_steps": 40000, "loss": 0.0783, "lr": 0.16178060897851115, "epoch": 0.9283463220384531, "percentage": 47.5, "elapsed_time": "19:58:40", "remaining_time": "22:04:50", "throughput": 334.59, "total_tokens": 24063776} {"current_steps": 19000, "total_steps": 40000, "eval_loss": 0.06752932816743851, "epoch": 0.9283463220384531, "percentage": 47.5, "elapsed_time": "20:09:20", "remaining_time": "22:16:38", "throughput": 331.64, "total_tokens": 24063776} {"current_steps": 19005, "total_steps": 40000, "loss": 0.0592, "lr": 0.16172188515660096, "epoch": 0.9285906237021474, "percentage": 47.51, "elapsed_time": "20:09:24", "remaining_time": "22:16:02", "throughput": 331.71, "total_tokens": 24070432} {"current_steps": 19010, "total_steps": 40000, "loss": 0.0634, "lr": 0.16166315952702878, "epoch": 0.9288349253658418, "percentage": 47.52, "elapsed_time": "20:09:27", "remaining_time": "22:15:25", "throughput": 331.78, "total_tokens": 24076768} {"current_steps": 19015, "total_steps": 40000, "loss": 0.0641, "lr": 0.16160443209885084, "epoch": 0.929079227029536, "percentage": 47.54, "elapsed_time": "20:09:30", "remaining_time": "22:14:48", "throughput": 331.86, "total_tokens": 24083104} {"current_steps": 19020, "total_steps": 40000, "loss": 0.0538, "lr": 0.16154570288112363, "epoch": 0.9293235286932304, "percentage": 47.55, "elapsed_time": "20:09:33", "remaining_time": "22:14:12", "throughput": 331.94, "total_tokens": 24089984} {"current_steps": 19025, "total_steps": 40000, "loss": 0.0574, "lr": 0.16148697188290395, "epoch": 0.9295678303569247, "percentage": 47.56, "elapsed_time": "20:09:36", "remaining_time": "22:13:35", "throughput": 332.01, "total_tokens": 24096064} {"current_steps": 19030, "total_steps": 40000, "loss": 0.0711, "lr": 0.16142823911324888, "epoch": 0.9298121320206191, "percentage": 47.58, "elapsed_time": "20:09:39", "remaining_time": "22:12:58", "throughput": 332.09, "total_tokens": 24102816} {"current_steps": 19035, "total_steps": 40000, "loss": 0.0612, "lr": 0.16136950458121568, "epoch": 0.9300564336843133, "percentage": 47.59, "elapsed_time": "20:09:42", "remaining_time": "22:12:22", "throughput": 332.16, "total_tokens": 24108928} {"current_steps": 19040, "total_steps": 40000, "loss": 0.0441, "lr": 0.16131076829586205, "epoch": 0.9303007353480077, "percentage": 47.6, "elapsed_time": "20:09:45", "remaining_time": "22:11:45", "throughput": 332.23, "total_tokens": 24115200} {"current_steps": 19045, "total_steps": 40000, "loss": 0.0496, "lr": 0.1612520302662457, "epoch": 0.9305450370117021, "percentage": 47.61, "elapsed_time": "20:09:49", "remaining_time": "22:11:08", "throughput": 332.3, "total_tokens": 24121248} {"current_steps": 19050, "total_steps": 40000, "loss": 0.0439, "lr": 0.16119329050142497, "epoch": 0.9307893386753964, "percentage": 47.62, "elapsed_time": "20:09:52", "remaining_time": "22:10:32", "throughput": 332.38, "total_tokens": 24127968} {"current_steps": 19055, "total_steps": 40000, "loss": 0.0617, "lr": 0.16113454901045818, "epoch": 0.9310336403390908, "percentage": 47.64, "elapsed_time": "20:09:55", "remaining_time": "22:09:55", "throughput": 332.45, "total_tokens": 24134208} {"current_steps": 19060, "total_steps": 40000, "loss": 0.0606, "lr": 0.16107580580240397, "epoch": 0.931277942002785, "percentage": 47.65, "elapsed_time": "20:09:58", "remaining_time": "22:09:19", "throughput": 332.52, "total_tokens": 24140416} {"current_steps": 19065, "total_steps": 40000, "loss": 0.0344, "lr": 0.16101706088632134, "epoch": 0.9315222436664794, "percentage": 47.66, "elapsed_time": "20:10:01", "remaining_time": "22:08:42", "throughput": 332.6, "total_tokens": 24147264} {"current_steps": 19070, "total_steps": 40000, "loss": 0.0682, "lr": 0.16095831427126947, "epoch": 0.9317665453301737, "percentage": 47.67, "elapsed_time": "20:10:04", "remaining_time": "22:08:06", "throughput": 332.68, "total_tokens": 24153856} {"current_steps": 19075, "total_steps": 40000, "loss": 0.0696, "lr": 0.16089956596630783, "epoch": 0.932010846993868, "percentage": 47.69, "elapsed_time": "20:10:07", "remaining_time": "22:07:29", "throughput": 332.75, "total_tokens": 24159968} {"current_steps": 19080, "total_steps": 40000, "loss": 0.0402, "lr": 0.16084081598049618, "epoch": 0.9322551486575623, "percentage": 47.7, "elapsed_time": "20:10:10", "remaining_time": "22:06:53", "throughput": 332.82, "total_tokens": 24166464} {"current_steps": 19085, "total_steps": 40000, "loss": 0.05, "lr": 0.1607820643228944, "epoch": 0.9324994503212567, "percentage": 47.71, "elapsed_time": "20:10:14", "remaining_time": "22:06:16", "throughput": 332.9, "total_tokens": 24172928} {"current_steps": 19090, "total_steps": 40000, "loss": 0.0669, "lr": 0.16072331100256285, "epoch": 0.932743751984951, "percentage": 47.73, "elapsed_time": "20:10:17", "remaining_time": "22:05:40", "throughput": 332.97, "total_tokens": 24179136} {"current_steps": 19095, "total_steps": 40000, "loss": 0.0572, "lr": 0.16066455602856197, "epoch": 0.9329880536486453, "percentage": 47.74, "elapsed_time": "20:10:20", "remaining_time": "22:05:03", "throughput": 333.04, "total_tokens": 24185312} {"current_steps": 19100, "total_steps": 40000, "loss": 0.0886, "lr": 0.16060579940995257, "epoch": 0.9332323553123397, "percentage": 47.75, "elapsed_time": "20:10:23", "remaining_time": "22:04:27", "throughput": 333.11, "total_tokens": 24191328} {"current_steps": 19105, "total_steps": 40000, "loss": 0.0775, "lr": 0.16054704115579557, "epoch": 0.933476656976034, "percentage": 47.76, "elapsed_time": "20:10:26", "remaining_time": "22:03:50", "throughput": 333.18, "total_tokens": 24197472} {"current_steps": 19110, "total_steps": 40000, "loss": 0.0557, "lr": 0.1604882812751523, "epoch": 0.9337209586397284, "percentage": 47.77, "elapsed_time": "20:10:29", "remaining_time": "22:03:14", "throughput": 333.25, "total_tokens": 24203808} {"current_steps": 19115, "total_steps": 40000, "loss": 0.0507, "lr": 0.16042951977708425, "epoch": 0.9339652603034226, "percentage": 47.79, "elapsed_time": "20:10:32", "remaining_time": "22:02:38", "throughput": 333.33, "total_tokens": 24210368} {"current_steps": 19120, "total_steps": 40000, "loss": 0.0591, "lr": 0.16037075667065318, "epoch": 0.934209561967117, "percentage": 47.8, "elapsed_time": "20:10:35", "remaining_time": "22:02:01", "throughput": 333.4, "total_tokens": 24216640} {"current_steps": 19125, "total_steps": 40000, "loss": 0.0581, "lr": 0.1603119919649211, "epoch": 0.9344538636308113, "percentage": 47.81, "elapsed_time": "20:10:38", "remaining_time": "22:01:25", "throughput": 333.47, "total_tokens": 24222944} {"current_steps": 19130, "total_steps": 40000, "loss": 0.0673, "lr": 0.16025322566895028, "epoch": 0.9346981652945057, "percentage": 47.83, "elapsed_time": "20:10:41", "remaining_time": "22:00:49", "throughput": 333.55, "total_tokens": 24229472} {"current_steps": 19135, "total_steps": 40000, "loss": 0.0695, "lr": 0.16019445779180322, "epoch": 0.9349424669581999, "percentage": 47.84, "elapsed_time": "20:10:44", "remaining_time": "22:00:12", "throughput": 333.61, "total_tokens": 24235328} {"current_steps": 19140, "total_steps": 40000, "loss": 0.0634, "lr": 0.16013568834254271, "epoch": 0.9351867686218943, "percentage": 47.85, "elapsed_time": "20:10:47", "remaining_time": "21:59:36", "throughput": 333.69, "total_tokens": 24241504} {"current_steps": 19145, "total_steps": 40000, "loss": 0.0853, "lr": 0.1600769173302316, "epoch": 0.9354310702855887, "percentage": 47.86, "elapsed_time": "20:10:50", "remaining_time": "21:58:59", "throughput": 333.76, "total_tokens": 24247744} {"current_steps": 19150, "total_steps": 40000, "loss": 0.0333, "lr": 0.16001814476393322, "epoch": 0.935675371949283, "percentage": 47.88, "elapsed_time": "20:10:53", "remaining_time": "21:58:23", "throughput": 333.82, "total_tokens": 24253472} {"current_steps": 19155, "total_steps": 40000, "loss": 0.0863, "lr": 0.15995937065271104, "epoch": 0.9359196736129773, "percentage": 47.89, "elapsed_time": "20:10:56", "remaining_time": "21:57:47", "throughput": 333.9, "total_tokens": 24260000} {"current_steps": 19160, "total_steps": 40000, "loss": 0.0743, "lr": 0.15990059500562873, "epoch": 0.9361639752766716, "percentage": 47.9, "elapsed_time": "20:11:00", "remaining_time": "21:57:11", "throughput": 333.98, "total_tokens": 24266816} {"current_steps": 19165, "total_steps": 40000, "loss": 0.055, "lr": 0.15984181783175025, "epoch": 0.936408276940366, "percentage": 47.91, "elapsed_time": "20:11:03", "remaining_time": "21:56:34", "throughput": 334.04, "total_tokens": 24272736} {"current_steps": 19170, "total_steps": 40000, "loss": 0.0544, "lr": 0.1597830391401398, "epoch": 0.9366525786040603, "percentage": 47.93, "elapsed_time": "20:11:06", "remaining_time": "21:55:58", "throughput": 334.12, "total_tokens": 24279552} {"current_steps": 19175, "total_steps": 40000, "loss": 0.0736, "lr": 0.15972425893986178, "epoch": 0.9368968802677546, "percentage": 47.94, "elapsed_time": "20:11:09", "remaining_time": "21:55:22", "throughput": 334.2, "total_tokens": 24285824} {"current_steps": 19180, "total_steps": 40000, "loss": 0.0728, "lr": 0.15966547723998084, "epoch": 0.9371411819314489, "percentage": 47.95, "elapsed_time": "20:11:12", "remaining_time": "21:54:46", "throughput": 334.26, "total_tokens": 24291840} {"current_steps": 19185, "total_steps": 40000, "loss": 0.0666, "lr": 0.15960669404956176, "epoch": 0.9373854835951433, "percentage": 47.96, "elapsed_time": "20:11:15", "remaining_time": "21:54:10", "throughput": 334.33, "total_tokens": 24297728} {"current_steps": 19190, "total_steps": 40000, "loss": 0.0487, "lr": 0.1595479093776698, "epoch": 0.9376297852588377, "percentage": 47.98, "elapsed_time": "20:11:18", "remaining_time": "21:53:34", "throughput": 334.4, "total_tokens": 24303968} {"current_steps": 19195, "total_steps": 40000, "loss": 0.0595, "lr": 0.15948912323337022, "epoch": 0.9378740869225319, "percentage": 47.99, "elapsed_time": "20:11:21", "remaining_time": "21:52:58", "throughput": 334.48, "total_tokens": 24310848} {"current_steps": 19200, "total_steps": 40000, "loss": 0.0543, "lr": 0.1594303356257286, "epoch": 0.9381183885862263, "percentage": 48.0, "elapsed_time": "20:11:24", "remaining_time": "21:52:21", "throughput": 334.56, "total_tokens": 24317280} {"current_steps": 19200, "total_steps": 40000, "eval_loss": 0.06483117491006851, "epoch": 0.9381183885862263, "percentage": 48.0, "elapsed_time": "20:22:05", "remaining_time": "22:03:55", "throughput": 331.64, "total_tokens": 24317280} {"current_steps": 19205, "total_steps": 40000, "loss": 0.0421, "lr": 0.15937154656381072, "epoch": 0.9383626902499206, "percentage": 48.01, "elapsed_time": "20:22:09", "remaining_time": "22:03:20", "throughput": 331.71, "total_tokens": 24323840} {"current_steps": 19210, "total_steps": 40000, "loss": 0.0603, "lr": 0.15931275605668258, "epoch": 0.938606991913615, "percentage": 48.02, "elapsed_time": "20:22:12", "remaining_time": "22:02:44", "throughput": 331.78, "total_tokens": 24330208} {"current_steps": 19215, "total_steps": 40000, "loss": 0.0642, "lr": 0.1592539641134104, "epoch": 0.9388512935773092, "percentage": 48.04, "elapsed_time": "20:22:15", "remaining_time": "22:02:07", "throughput": 331.85, "total_tokens": 24336416} {"current_steps": 19220, "total_steps": 40000, "loss": 0.0414, "lr": 0.1591951707430607, "epoch": 0.9390955952410036, "percentage": 48.05, "elapsed_time": "20:22:18", "remaining_time": "22:01:31", "throughput": 331.92, "total_tokens": 24342880} {"current_steps": 19225, "total_steps": 40000, "loss": 0.0575, "lr": 0.15913637595470007, "epoch": 0.9393398969046979, "percentage": 48.06, "elapsed_time": "20:22:21", "remaining_time": "22:00:55", "throughput": 332.0, "total_tokens": 24349728} {"current_steps": 19230, "total_steps": 40000, "loss": 0.0635, "lr": 0.15907757975739548, "epoch": 0.9395841985683923, "percentage": 48.08, "elapsed_time": "20:22:25", "remaining_time": "22:00:18", "throughput": 332.07, "total_tokens": 24356000} {"current_steps": 19235, "total_steps": 40000, "loss": 0.0846, "lr": 0.159018782160214, "epoch": 0.9398285002320865, "percentage": 48.09, "elapsed_time": "20:22:27", "remaining_time": "21:59:42", "throughput": 332.14, "total_tokens": 24361984} {"current_steps": 19240, "total_steps": 40000, "loss": 0.0527, "lr": 0.158959983172223, "epoch": 0.9400728018957809, "percentage": 48.1, "elapsed_time": "20:22:31", "remaining_time": "21:59:06", "throughput": 332.22, "total_tokens": 24368832} {"current_steps": 19245, "total_steps": 40000, "loss": 0.0671, "lr": 0.15890118280249, "epoch": 0.9403171035594753, "percentage": 48.11, "elapsed_time": "20:22:34", "remaining_time": "21:58:29", "throughput": 332.3, "total_tokens": 24375712} {"current_steps": 19250, "total_steps": 40000, "loss": 0.0563, "lr": 0.15884238106008275, "epoch": 0.9405614052231696, "percentage": 48.12, "elapsed_time": "20:22:37", "remaining_time": "21:57:53", "throughput": 332.38, "total_tokens": 24382208} {"current_steps": 19255, "total_steps": 40000, "loss": 0.0474, "lr": 0.15878357795406922, "epoch": 0.9408057068868639, "percentage": 48.14, "elapsed_time": "20:22:40", "remaining_time": "21:57:17", "throughput": 332.44, "total_tokens": 24388288} {"current_steps": 19260, "total_steps": 40000, "loss": 0.0458, "lr": 0.15872477349351757, "epoch": 0.9410500085505582, "percentage": 48.15, "elapsed_time": "20:22:43", "remaining_time": "21:56:41", "throughput": 332.52, "total_tokens": 24394720} {"current_steps": 19265, "total_steps": 40000, "loss": 0.0398, "lr": 0.15866596768749622, "epoch": 0.9412943102142526, "percentage": 48.16, "elapsed_time": "20:22:46", "remaining_time": "21:56:04", "throughput": 332.59, "total_tokens": 24401312} {"current_steps": 19270, "total_steps": 40000, "loss": 0.0866, "lr": 0.15860716054507373, "epoch": 0.9415386118779469, "percentage": 48.18, "elapsed_time": "20:22:49", "remaining_time": "21:55:28", "throughput": 332.66, "total_tokens": 24407584} {"current_steps": 19275, "total_steps": 40000, "loss": 0.0862, "lr": 0.1585483520753189, "epoch": 0.9417829135416412, "percentage": 48.19, "elapsed_time": "20:22:53", "remaining_time": "21:54:52", "throughput": 332.74, "total_tokens": 24414144} {"current_steps": 19280, "total_steps": 40000, "loss": 0.0921, "lr": 0.1584895422873008, "epoch": 0.9420272152053355, "percentage": 48.2, "elapsed_time": "20:22:56", "remaining_time": "21:54:16", "throughput": 332.81, "total_tokens": 24420640} {"current_steps": 19285, "total_steps": 40000, "loss": 0.0811, "lr": 0.1584307311900886, "epoch": 0.9422715168690299, "percentage": 48.21, "elapsed_time": "20:22:59", "remaining_time": "21:53:40", "throughput": 332.89, "total_tokens": 24426880} {"current_steps": 19290, "total_steps": 40000, "loss": 0.0323, "lr": 0.1583719187927517, "epoch": 0.9425158185327243, "percentage": 48.23, "elapsed_time": "20:23:02", "remaining_time": "21:53:04", "throughput": 332.96, "total_tokens": 24433376} {"current_steps": 19295, "total_steps": 40000, "loss": 0.0781, "lr": 0.15831310510435967, "epoch": 0.9427601201964185, "percentage": 48.24, "elapsed_time": "20:23:05", "remaining_time": "21:52:28", "throughput": 333.04, "total_tokens": 24440000} {"current_steps": 19300, "total_steps": 40000, "loss": 0.04, "lr": 0.15825429013398243, "epoch": 0.9430044218601129, "percentage": 48.25, "elapsed_time": "20:23:08", "remaining_time": "21:51:52", "throughput": 333.11, "total_tokens": 24446464} {"current_steps": 19305, "total_steps": 40000, "loss": 0.0605, "lr": 0.15819547389068986, "epoch": 0.9432487235238072, "percentage": 48.26, "elapsed_time": "20:23:11", "remaining_time": "21:51:16", "throughput": 333.18, "total_tokens": 24452992} {"current_steps": 19310, "total_steps": 40000, "loss": 0.0753, "lr": 0.1581366563835522, "epoch": 0.9434930251875016, "percentage": 48.27, "elapsed_time": "20:23:14", "remaining_time": "21:50:40", "throughput": 333.26, "total_tokens": 24459680} {"current_steps": 19315, "total_steps": 40000, "loss": 0.1059, "lr": 0.15807783762163993, "epoch": 0.9437373268511958, "percentage": 48.29, "elapsed_time": "20:23:17", "remaining_time": "21:50:04", "throughput": 333.33, "total_tokens": 24466048} {"current_steps": 19320, "total_steps": 40000, "loss": 0.0736, "lr": 0.15801901761402365, "epoch": 0.9439816285148902, "percentage": 48.3, "elapsed_time": "20:23:21", "remaining_time": "21:49:28", "throughput": 333.41, "total_tokens": 24472832} {"current_steps": 19325, "total_steps": 40000, "loss": 0.0613, "lr": 0.157960196369774, "epoch": 0.9442259301785845, "percentage": 48.31, "elapsed_time": "20:23:24", "remaining_time": "21:48:52", "throughput": 333.49, "total_tokens": 24479488} {"current_steps": 19330, "total_steps": 40000, "loss": 0.0561, "lr": 0.157901373897962, "epoch": 0.9444702318422789, "percentage": 48.33, "elapsed_time": "20:23:27", "remaining_time": "21:48:16", "throughput": 333.56, "total_tokens": 24485440} {"current_steps": 19335, "total_steps": 40000, "loss": 0.0808, "lr": 0.15784255020765892, "epoch": 0.9447145335059732, "percentage": 48.34, "elapsed_time": "20:23:30", "remaining_time": "21:47:40", "throughput": 333.62, "total_tokens": 24491360} {"current_steps": 19340, "total_steps": 40000, "loss": 0.075, "lr": 0.157783725307936, "epoch": 0.9449588351696675, "percentage": 48.35, "elapsed_time": "20:23:33", "remaining_time": "21:47:04", "throughput": 333.69, "total_tokens": 24497504} {"current_steps": 19345, "total_steps": 40000, "loss": 0.047, "lr": 0.15772489920786484, "epoch": 0.9452031368333619, "percentage": 48.36, "elapsed_time": "20:23:36", "remaining_time": "21:46:28", "throughput": 333.77, "total_tokens": 24504128} {"current_steps": 19350, "total_steps": 40000, "loss": 0.0548, "lr": 0.15766607191651713, "epoch": 0.9454474384970561, "percentage": 48.38, "elapsed_time": "20:23:39", "remaining_time": "21:45:52", "throughput": 333.84, "total_tokens": 24510560} {"current_steps": 19355, "total_steps": 40000, "loss": 0.06, "lr": 0.1576072434429648, "epoch": 0.9456917401607505, "percentage": 48.39, "elapsed_time": "20:23:42", "remaining_time": "21:45:16", "throughput": 333.92, "total_tokens": 24517088} {"current_steps": 19360, "total_steps": 40000, "loss": 0.0645, "lr": 0.15754841379627998, "epoch": 0.9459360418244448, "percentage": 48.4, "elapsed_time": "20:23:45", "remaining_time": "21:44:40", "throughput": 333.99, "total_tokens": 24523520} {"current_steps": 19365, "total_steps": 40000, "loss": 0.0563, "lr": 0.15748958298553484, "epoch": 0.9461803434881392, "percentage": 48.41, "elapsed_time": "20:23:48", "remaining_time": "21:44:04", "throughput": 334.06, "total_tokens": 24529728} {"current_steps": 19370, "total_steps": 40000, "loss": 0.0591, "lr": 0.1574307510198019, "epoch": 0.9464246451518334, "percentage": 48.43, "elapsed_time": "20:23:51", "remaining_time": "21:43:28", "throughput": 334.13, "total_tokens": 24535936} {"current_steps": 19375, "total_steps": 40000, "loss": 0.0854, "lr": 0.15737191790815375, "epoch": 0.9466689468155278, "percentage": 48.44, "elapsed_time": "20:23:55", "remaining_time": "21:42:52", "throughput": 334.2, "total_tokens": 24541856} {"current_steps": 19380, "total_steps": 40000, "loss": 0.0546, "lr": 0.15731308365966323, "epoch": 0.9469132484792221, "percentage": 48.45, "elapsed_time": "20:23:58", "remaining_time": "21:42:16", "throughput": 334.27, "total_tokens": 24547872} {"current_steps": 19385, "total_steps": 40000, "loss": 0.0577, "lr": 0.15725424828340331, "epoch": 0.9471575501429165, "percentage": 48.46, "elapsed_time": "20:24:01", "remaining_time": "21:41:41", "throughput": 334.34, "total_tokens": 24554208} {"current_steps": 19390, "total_steps": 40000, "loss": 0.0643, "lr": 0.15719541178844715, "epoch": 0.9474018518066109, "percentage": 48.48, "elapsed_time": "20:24:04", "remaining_time": "21:41:05", "throughput": 334.41, "total_tokens": 24560672} {"current_steps": 19395, "total_steps": 40000, "loss": 0.0597, "lr": 0.15713657418386806, "epoch": 0.9476461534703051, "percentage": 48.49, "elapsed_time": "20:24:07", "remaining_time": "21:40:29", "throughput": 334.48, "total_tokens": 24566880} {"current_steps": 19400, "total_steps": 40000, "loss": 0.0599, "lr": 0.15707773547873957, "epoch": 0.9478904551339995, "percentage": 48.5, "elapsed_time": "20:24:10", "remaining_time": "21:39:53", "throughput": 334.55, "total_tokens": 24573184} {"current_steps": 19400, "total_steps": 40000, "eval_loss": 0.06481385231018066, "epoch": 0.9478904551339995, "percentage": 48.5, "elapsed_time": "20:34:50", "remaining_time": "21:51:13", "throughput": 331.66, "total_tokens": 24573184} {"current_steps": 19405, "total_steps": 40000, "loss": 0.0492, "lr": 0.1570188956821353, "epoch": 0.9481347567976938, "percentage": 48.51, "elapsed_time": "20:34:54", "remaining_time": "21:50:38", "throughput": 331.72, "total_tokens": 24578912} {"current_steps": 19410, "total_steps": 40000, "loss": 0.0408, "lr": 0.1569600548031291, "epoch": 0.9483790584613881, "percentage": 48.52, "elapsed_time": "20:34:57", "remaining_time": "21:50:01", "throughput": 331.79, "total_tokens": 24585088} {"current_steps": 19415, "total_steps": 40000, "loss": 0.0355, "lr": 0.156901212850795, "epoch": 0.9486233601250824, "percentage": 48.54, "elapsed_time": "20:35:00", "remaining_time": "21:49:25", "throughput": 331.87, "total_tokens": 24591456} {"current_steps": 19420, "total_steps": 40000, "loss": 0.0724, "lr": 0.15684236983420716, "epoch": 0.9488676617887768, "percentage": 48.55, "elapsed_time": "20:35:03", "remaining_time": "21:48:49", "throughput": 331.94, "total_tokens": 24597696} {"current_steps": 19425, "total_steps": 40000, "loss": 0.0611, "lr": 0.1567835257624399, "epoch": 0.9491119634524711, "percentage": 48.56, "elapsed_time": "20:35:06", "remaining_time": "21:48:13", "throughput": 332.01, "total_tokens": 24603808} {"current_steps": 19430, "total_steps": 40000, "loss": 0.0781, "lr": 0.1567246806445677, "epoch": 0.9493562651161654, "percentage": 48.58, "elapsed_time": "20:35:09", "remaining_time": "21:47:37", "throughput": 332.07, "total_tokens": 24609760} {"current_steps": 19435, "total_steps": 40000, "loss": 0.103, "lr": 0.15666583448966526, "epoch": 0.9496005667798598, "percentage": 48.59, "elapsed_time": "20:35:12", "remaining_time": "21:47:01", "throughput": 332.14, "total_tokens": 24616064} {"current_steps": 19440, "total_steps": 40000, "loss": 0.0603, "lr": 0.1566069873068074, "epoch": 0.9498448684435541, "percentage": 48.6, "elapsed_time": "20:35:15", "remaining_time": "21:46:25", "throughput": 332.22, "total_tokens": 24622528} {"current_steps": 19445, "total_steps": 40000, "loss": 0.1151, "lr": 0.156548139105069, "epoch": 0.9500891701072485, "percentage": 48.61, "elapsed_time": "20:35:18", "remaining_time": "21:45:49", "throughput": 332.28, "total_tokens": 24628448} {"current_steps": 19450, "total_steps": 40000, "loss": 0.0639, "lr": 0.15648928989352529, "epoch": 0.9503334717709427, "percentage": 48.62, "elapsed_time": "20:35:21", "remaining_time": "21:45:13", "throughput": 332.36, "total_tokens": 24634752} {"current_steps": 19455, "total_steps": 40000, "loss": 0.0753, "lr": 0.15643043968125156, "epoch": 0.9505777734346371, "percentage": 48.64, "elapsed_time": "20:35:25", "remaining_time": "21:44:38", "throughput": 332.43, "total_tokens": 24641632} {"current_steps": 19460, "total_steps": 40000, "loss": 0.0589, "lr": 0.15637158847732316, "epoch": 0.9508220750983314, "percentage": 48.65, "elapsed_time": "20:35:28", "remaining_time": "21:44:01", "throughput": 332.5, "total_tokens": 24647616} {"current_steps": 19465, "total_steps": 40000, "loss": 0.0762, "lr": 0.15631273629081582, "epoch": 0.9510663767620258, "percentage": 48.66, "elapsed_time": "20:35:31", "remaining_time": "21:43:26", "throughput": 332.57, "total_tokens": 24654048} {"current_steps": 19470, "total_steps": 40000, "loss": 0.0669, "lr": 0.15625388313080518, "epoch": 0.95131067842572, "percentage": 48.68, "elapsed_time": "20:35:34", "remaining_time": "21:42:50", "throughput": 332.64, "total_tokens": 24660160} {"current_steps": 19475, "total_steps": 40000, "loss": 0.0469, "lr": 0.15619502900636714, "epoch": 0.9515549800894144, "percentage": 48.69, "elapsed_time": "20:35:37", "remaining_time": "21:42:14", "throughput": 332.71, "total_tokens": 24666272} {"current_steps": 19480, "total_steps": 40000, "loss": 0.0699, "lr": 0.15613617392657783, "epoch": 0.9517992817531087, "percentage": 48.7, "elapsed_time": "20:35:40", "remaining_time": "21:41:38", "throughput": 332.78, "total_tokens": 24672320} {"current_steps": 19485, "total_steps": 40000, "loss": 0.0741, "lr": 0.15607731790051335, "epoch": 0.9520435834168031, "percentage": 48.71, "elapsed_time": "20:35:43", "remaining_time": "21:41:02", "throughput": 332.85, "total_tokens": 24678368} {"current_steps": 19490, "total_steps": 40000, "loss": 0.0531, "lr": 0.15601846093725008, "epoch": 0.9522878850804974, "percentage": 48.73, "elapsed_time": "20:35:46", "remaining_time": "21:40:26", "throughput": 332.92, "total_tokens": 24684512} {"current_steps": 19495, "total_steps": 40000, "loss": 0.0781, "lr": 0.1559596030458645, "epoch": 0.9525321867441917, "percentage": 48.74, "elapsed_time": "20:35:49", "remaining_time": "21:39:50", "throughput": 332.98, "total_tokens": 24690592} {"current_steps": 19500, "total_steps": 40000, "loss": 0.051, "lr": 0.1559007442354333, "epoch": 0.9527764884078861, "percentage": 48.75, "elapsed_time": "20:35:52", "remaining_time": "21:39:15", "throughput": 333.06, "total_tokens": 24697120} {"current_steps": 19505, "total_steps": 40000, "loss": 0.0886, "lr": 0.15584188451503314, "epoch": 0.9530207900715804, "percentage": 48.76, "elapsed_time": "20:35:55", "remaining_time": "21:38:39", "throughput": 333.12, "total_tokens": 24703008} {"current_steps": 19510, "total_steps": 40000, "loss": 0.0573, "lr": 0.15578302389374094, "epoch": 0.9532650917352747, "percentage": 48.77, "elapsed_time": "20:35:58", "remaining_time": "21:38:03", "throughput": 333.2, "total_tokens": 24709600} {"current_steps": 19515, "total_steps": 40000, "loss": 0.0598, "lr": 0.1557241623806338, "epoch": 0.953509393398969, "percentage": 48.79, "elapsed_time": "20:36:01", "remaining_time": "21:37:27", "throughput": 333.27, "total_tokens": 24716224} {"current_steps": 19520, "total_steps": 40000, "loss": 0.0686, "lr": 0.15566529998478887, "epoch": 0.9537536950626634, "percentage": 48.8, "elapsed_time": "20:36:04", "remaining_time": "21:36:52", "throughput": 333.35, "total_tokens": 24722912} {"current_steps": 19525, "total_steps": 40000, "loss": 0.0508, "lr": 0.15560643671528354, "epoch": 0.9539979967263577, "percentage": 48.81, "elapsed_time": "20:36:08", "remaining_time": "21:36:16", "throughput": 333.43, "total_tokens": 24729504} {"current_steps": 19530, "total_steps": 40000, "loss": 0.0334, "lr": 0.15554757258119514, "epoch": 0.954242298390052, "percentage": 48.83, "elapsed_time": "20:36:11", "remaining_time": "21:35:41", "throughput": 333.5, "total_tokens": 24736064} {"current_steps": 19535, "total_steps": 40000, "loss": 0.0499, "lr": 0.1554887075916014, "epoch": 0.9544866000537464, "percentage": 48.84, "elapsed_time": "20:36:14", "remaining_time": "21:35:05", "throughput": 333.57, "total_tokens": 24742496} {"current_steps": 19540, "total_steps": 40000, "loss": 0.0572, "lr": 0.15542984175558, "epoch": 0.9547309017174407, "percentage": 48.85, "elapsed_time": "20:36:17", "remaining_time": "21:34:29", "throughput": 333.64, "total_tokens": 24748672} {"current_steps": 19545, "total_steps": 40000, "loss": 0.0383, "lr": 0.1553709750822087, "epoch": 0.9549752033811351, "percentage": 48.86, "elapsed_time": "20:36:20", "remaining_time": "21:33:54", "throughput": 333.71, "total_tokens": 24754976} {"current_steps": 19550, "total_steps": 40000, "loss": 0.0845, "lr": 0.15531210758056554, "epoch": 0.9552195050448293, "percentage": 48.88, "elapsed_time": "20:36:23", "remaining_time": "21:33:18", "throughput": 333.79, "total_tokens": 24761376} {"current_steps": 19555, "total_steps": 40000, "loss": 0.0608, "lr": 0.15525323925972867, "epoch": 0.9554638067085237, "percentage": 48.89, "elapsed_time": "20:36:26", "remaining_time": "21:32:43", "throughput": 333.86, "total_tokens": 24767584} {"current_steps": 19560, "total_steps": 40000, "loss": 0.0603, "lr": 0.15519437012877627, "epoch": 0.955708108372218, "percentage": 48.9, "elapsed_time": "20:36:29", "remaining_time": "21:32:07", "throughput": 333.93, "total_tokens": 24774144} {"current_steps": 19565, "total_steps": 40000, "loss": 0.0694, "lr": 0.15513550019678676, "epoch": 0.9559524100359124, "percentage": 48.91, "elapsed_time": "20:36:32", "remaining_time": "21:31:32", "throughput": 334.0, "total_tokens": 24780448} {"current_steps": 19570, "total_steps": 40000, "loss": 0.0464, "lr": 0.15507662947283854, "epoch": 0.9561967116996066, "percentage": 48.93, "elapsed_time": "20:36:36", "remaining_time": "21:30:56", "throughput": 334.08, "total_tokens": 24787392} {"current_steps": 19575, "total_steps": 40000, "loss": 0.0572, "lr": 0.15501775796601028, "epoch": 0.956441013363301, "percentage": 48.94, "elapsed_time": "20:36:39", "remaining_time": "21:30:21", "throughput": 334.15, "total_tokens": 24793632} {"current_steps": 19580, "total_steps": 40000, "loss": 0.084, "lr": 0.15495888568538066, "epoch": 0.9566853150269954, "percentage": 48.95, "elapsed_time": "20:36:42", "remaining_time": "21:29:45", "throughput": 334.23, "total_tokens": 24800672} {"current_steps": 19585, "total_steps": 40000, "loss": 0.0526, "lr": 0.1549000126400286, "epoch": 0.9569296166906897, "percentage": 48.96, "elapsed_time": "20:36:45", "remaining_time": "21:29:10", "throughput": 334.31, "total_tokens": 24807616} {"current_steps": 19590, "total_steps": 40000, "loss": 0.0532, "lr": 0.15484113883903294, "epoch": 0.957173918354384, "percentage": 48.98, "elapsed_time": "20:36:48", "remaining_time": "21:28:34", "throughput": 334.38, "total_tokens": 24814080} {"current_steps": 19595, "total_steps": 40000, "loss": 0.0717, "lr": 0.15478226429147288, "epoch": 0.9574182200180783, "percentage": 48.99, "elapsed_time": "20:36:51", "remaining_time": "21:27:59", "throughput": 334.46, "total_tokens": 24820576} {"current_steps": 19600, "total_steps": 40000, "loss": 0.1142, "lr": 0.15472338900642757, "epoch": 0.9576625216817727, "percentage": 49.0, "elapsed_time": "20:36:54", "remaining_time": "21:27:23", "throughput": 334.52, "total_tokens": 24826560} {"current_steps": 19600, "total_steps": 40000, "eval_loss": 0.06485845893621445, "epoch": 0.9576625216817727, "percentage": 49.0, "elapsed_time": "20:47:35", "remaining_time": "21:38:30", "throughput": 331.66, "total_tokens": 24826560} {"current_steps": 19605, "total_steps": 40000, "loss": 0.077, "lr": 0.15466451299297632, "epoch": 0.957906823345467, "percentage": 49.01, "elapsed_time": "20:47:38", "remaining_time": "21:37:55", "throughput": 331.73, "total_tokens": 24832736} {"current_steps": 19610, "total_steps": 40000, "loss": 0.0851, "lr": 0.15460563626019852, "epoch": 0.9581511250091613, "percentage": 49.02, "elapsed_time": "20:47:42", "remaining_time": "21:37:19", "throughput": 331.8, "total_tokens": 24839296} {"current_steps": 19615, "total_steps": 40000, "loss": 0.0668, "lr": 0.15454675881717375, "epoch": 0.9583954266728556, "percentage": 49.04, "elapsed_time": "20:47:45", "remaining_time": "21:36:44", "throughput": 331.87, "total_tokens": 24845600} {"current_steps": 19620, "total_steps": 40000, "loss": 0.0556, "lr": 0.1544878806729816, "epoch": 0.95863972833655, "percentage": 49.05, "elapsed_time": "20:47:48", "remaining_time": "21:36:08", "throughput": 331.94, "total_tokens": 24851712} {"current_steps": 19625, "total_steps": 40000, "loss": 0.0575, "lr": 0.1544290018367019, "epoch": 0.9588840300002442, "percentage": 49.06, "elapsed_time": "20:47:51", "remaining_time": "21:35:32", "throughput": 332.02, "total_tokens": 24858496} {"current_steps": 19630, "total_steps": 40000, "loss": 0.0555, "lr": 0.15437012231741445, "epoch": 0.9591283316639386, "percentage": 49.08, "elapsed_time": "20:47:54", "remaining_time": "21:34:57", "throughput": 332.09, "total_tokens": 24865088} {"current_steps": 19635, "total_steps": 40000, "loss": 0.0501, "lr": 0.1543112421241992, "epoch": 0.959372633327633, "percentage": 49.09, "elapsed_time": "20:47:57", "remaining_time": "21:34:21", "throughput": 332.16, "total_tokens": 24871264} {"current_steps": 19640, "total_steps": 40000, "loss": 0.074, "lr": 0.15425236126613626, "epoch": 0.9596169349913273, "percentage": 49.1, "elapsed_time": "20:48:00", "remaining_time": "21:33:45", "throughput": 332.23, "total_tokens": 24877280} {"current_steps": 19645, "total_steps": 40000, "loss": 0.0566, "lr": 0.15419347975230577, "epoch": 0.9598612366550217, "percentage": 49.11, "elapsed_time": "20:48:03", "remaining_time": "21:33:10", "throughput": 332.29, "total_tokens": 24883392} {"current_steps": 19650, "total_steps": 40000, "loss": 0.0582, "lr": 0.154134597591788, "epoch": 0.9601055383187159, "percentage": 49.12, "elapsed_time": "20:48:06", "remaining_time": "21:32:34", "throughput": 332.37, "total_tokens": 24889984} {"current_steps": 19655, "total_steps": 40000, "loss": 0.0612, "lr": 0.1540757147936633, "epoch": 0.9603498399824103, "percentage": 49.14, "elapsed_time": "20:48:09", "remaining_time": "21:31:58", "throughput": 332.44, "total_tokens": 24896576} {"current_steps": 19660, "total_steps": 40000, "loss": 0.0437, "lr": 0.1540168313670122, "epoch": 0.9605941416461046, "percentage": 49.15, "elapsed_time": "20:48:12", "remaining_time": "21:31:23", "throughput": 332.51, "total_tokens": 24902944} {"current_steps": 19665, "total_steps": 40000, "loss": 0.0595, "lr": 0.1539579473209152, "epoch": 0.960838443309799, "percentage": 49.16, "elapsed_time": "20:48:16", "remaining_time": "21:30:47", "throughput": 332.59, "total_tokens": 24909760} {"current_steps": 19670, "total_steps": 40000, "loss": 0.0601, "lr": 0.15389906266445294, "epoch": 0.9610827449734932, "percentage": 49.18, "elapsed_time": "20:48:19", "remaining_time": "21:30:12", "throughput": 332.65, "total_tokens": 24915552} {"current_steps": 19675, "total_steps": 40000, "loss": 0.0688, "lr": 0.15384017740670627, "epoch": 0.9613270466371876, "percentage": 49.19, "elapsed_time": "20:48:22", "remaining_time": "21:29:36", "throughput": 332.72, "total_tokens": 24921792} {"current_steps": 19680, "total_steps": 40000, "loss": 0.0729, "lr": 0.15378129155675602, "epoch": 0.961571348300882, "percentage": 49.2, "elapsed_time": "20:48:25", "remaining_time": "21:29:01", "throughput": 332.79, "total_tokens": 24927968} {"current_steps": 19685, "total_steps": 40000, "loss": 0.0869, "lr": 0.15372240512368307, "epoch": 0.9618156499645762, "percentage": 49.21, "elapsed_time": "20:48:28", "remaining_time": "21:28:25", "throughput": 332.86, "total_tokens": 24933856} {"current_steps": 19690, "total_steps": 40000, "loss": 0.0548, "lr": 0.1536635181165684, "epoch": 0.9620599516282706, "percentage": 49.23, "elapsed_time": "20:48:31", "remaining_time": "21:27:50", "throughput": 332.93, "total_tokens": 24940192} {"current_steps": 19695, "total_steps": 40000, "loss": 0.0626, "lr": 0.15360463054449328, "epoch": 0.9623042532919649, "percentage": 49.24, "elapsed_time": "20:48:34", "remaining_time": "21:27:14", "throughput": 333.0, "total_tokens": 24946176} {"current_steps": 19700, "total_steps": 40000, "loss": 0.079, "lr": 0.1535457424165388, "epoch": 0.9625485549556593, "percentage": 49.25, "elapsed_time": "20:48:37", "remaining_time": "21:26:39", "throughput": 333.07, "total_tokens": 24952480} {"current_steps": 19705, "total_steps": 40000, "loss": 0.0912, "lr": 0.15348685374178628, "epoch": 0.9627928566193535, "percentage": 49.26, "elapsed_time": "20:48:40", "remaining_time": "21:26:03", "throughput": 333.14, "total_tokens": 24959008} {"current_steps": 19710, "total_steps": 40000, "loss": 0.0801, "lr": 0.1534279645293171, "epoch": 0.9630371582830479, "percentage": 49.28, "elapsed_time": "20:48:43", "remaining_time": "21:25:28", "throughput": 333.21, "total_tokens": 24965440} {"current_steps": 19715, "total_steps": 40000, "loss": 0.0675, "lr": 0.1533690747882127, "epoch": 0.9632814599467422, "percentage": 49.29, "elapsed_time": "20:48:46", "remaining_time": "21:24:53", "throughput": 333.28, "total_tokens": 24971712} {"current_steps": 19720, "total_steps": 40000, "loss": 0.0552, "lr": 0.15331018452755465, "epoch": 0.9635257616104366, "percentage": 49.3, "elapsed_time": "20:48:49", "remaining_time": "21:24:17", "throughput": 333.35, "total_tokens": 24977888} {"current_steps": 19725, "total_steps": 40000, "loss": 0.069, "lr": 0.15325129375642457, "epoch": 0.963770063274131, "percentage": 49.31, "elapsed_time": "20:48:53", "remaining_time": "21:23:42", "throughput": 333.42, "total_tokens": 24984288} {"current_steps": 19730, "total_steps": 40000, "loss": 0.0992, "lr": 0.15319240248390406, "epoch": 0.9640143649378252, "percentage": 49.33, "elapsed_time": "20:48:56", "remaining_time": "21:23:07", "throughput": 333.49, "total_tokens": 24990304} {"current_steps": 19735, "total_steps": 40000, "loss": 0.0568, "lr": 0.153133510719075, "epoch": 0.9642586666015196, "percentage": 49.34, "elapsed_time": "20:48:59", "remaining_time": "21:22:31", "throughput": 333.56, "total_tokens": 24996768} {"current_steps": 19740, "total_steps": 40000, "loss": 0.0682, "lr": 0.15307461847101922, "epoch": 0.9645029682652139, "percentage": 49.35, "elapsed_time": "20:49:02", "remaining_time": "21:21:56", "throughput": 333.63, "total_tokens": 25002848} {"current_steps": 19745, "total_steps": 40000, "loss": 0.0682, "lr": 0.15301572574881864, "epoch": 0.9647472699289082, "percentage": 49.36, "elapsed_time": "20:49:05", "remaining_time": "21:21:21", "throughput": 333.7, "total_tokens": 25009088} {"current_steps": 19750, "total_steps": 40000, "loss": 0.0534, "lr": 0.15295683256155523, "epoch": 0.9649915715926025, "percentage": 49.38, "elapsed_time": "20:49:08", "remaining_time": "21:20:45", "throughput": 333.78, "total_tokens": 25015968} {"current_steps": 19755, "total_steps": 40000, "loss": 0.07, "lr": 0.15289793891831113, "epoch": 0.9652358732562969, "percentage": 49.39, "elapsed_time": "20:49:11", "remaining_time": "21:20:10", "throughput": 333.85, "total_tokens": 25022272} {"current_steps": 19760, "total_steps": 40000, "loss": 0.0566, "lr": 0.15283904482816837, "epoch": 0.9654801749199912, "percentage": 49.4, "elapsed_time": "20:49:14", "remaining_time": "21:19:35", "throughput": 333.92, "total_tokens": 25028800} {"current_steps": 19765, "total_steps": 40000, "loss": 0.0646, "lr": 0.15278015030020928, "epoch": 0.9657244765836855, "percentage": 49.41, "elapsed_time": "20:49:17", "remaining_time": "21:19:00", "throughput": 333.99, "total_tokens": 25034784} {"current_steps": 19770, "total_steps": 40000, "loss": 0.0541, "lr": 0.152721255343516, "epoch": 0.9659687782473798, "percentage": 49.43, "elapsed_time": "20:49:20", "remaining_time": "21:18:24", "throughput": 334.05, "total_tokens": 25040800} {"current_steps": 19775, "total_steps": 40000, "loss": 0.0498, "lr": 0.15266235996717098, "epoch": 0.9662130799110742, "percentage": 49.44, "elapsed_time": "20:49:23", "remaining_time": "21:17:49", "throughput": 334.12, "total_tokens": 25047200} {"current_steps": 19780, "total_steps": 40000, "loss": 0.0603, "lr": 0.15260346418025664, "epoch": 0.9664573815747686, "percentage": 49.45, "elapsed_time": "20:49:26", "remaining_time": "21:17:14", "throughput": 334.2, "total_tokens": 25053664} {"current_steps": 19785, "total_steps": 40000, "loss": 0.0412, "lr": 0.15254456799185537, "epoch": 0.9667016832384628, "percentage": 49.46, "elapsed_time": "20:49:30", "remaining_time": "21:16:39", "throughput": 334.28, "total_tokens": 25060672} {"current_steps": 19790, "total_steps": 40000, "loss": 0.08, "lr": 0.15248567141104974, "epoch": 0.9669459849021572, "percentage": 49.48, "elapsed_time": "20:49:33", "remaining_time": "21:16:04", "throughput": 334.36, "total_tokens": 25068096} {"current_steps": 19795, "total_steps": 40000, "loss": 0.0717, "lr": 0.15242677444692232, "epoch": 0.9671902865658515, "percentage": 49.49, "elapsed_time": "20:49:36", "remaining_time": "21:15:29", "throughput": 334.44, "total_tokens": 25074912} {"current_steps": 19800, "total_steps": 40000, "loss": 0.0612, "lr": 0.15236787710855584, "epoch": 0.9674345882295459, "percentage": 49.5, "elapsed_time": "20:49:39", "remaining_time": "21:14:54", "throughput": 334.51, "total_tokens": 25081792} {"current_steps": 19800, "total_steps": 40000, "eval_loss": 0.0653596892952919, "epoch": 0.9674345882295459, "percentage": 49.5, "elapsed_time": "21:00:20", "remaining_time": "21:25:47", "throughput": 331.68, "total_tokens": 25081792} {"current_steps": 19805, "total_steps": 40000, "loss": 0.0589, "lr": 0.1523089794050329, "epoch": 0.9676788898932401, "percentage": 49.51, "elapsed_time": "21:00:23", "remaining_time": "21:25:12", "throughput": 331.74, "total_tokens": 25087712} {"current_steps": 19810, "total_steps": 40000, "loss": 0.1, "lr": 0.15225008134543633, "epoch": 0.9679231915569345, "percentage": 49.53, "elapsed_time": "21:00:26", "remaining_time": "21:24:37", "throughput": 331.81, "total_tokens": 25094016} {"current_steps": 19815, "total_steps": 40000, "loss": 0.053, "lr": 0.15219118293884895, "epoch": 0.9681674932206288, "percentage": 49.54, "elapsed_time": "21:00:29", "remaining_time": "21:24:02", "throughput": 331.88, "total_tokens": 25100384} {"current_steps": 19820, "total_steps": 40000, "loss": 0.0542, "lr": 0.15213228419435362, "epoch": 0.9684117948843232, "percentage": 49.55, "elapsed_time": "21:00:33", "remaining_time": "21:23:26", "throughput": 331.96, "total_tokens": 25107104} {"current_steps": 19825, "total_steps": 40000, "loss": 0.0877, "lr": 0.15207338512103327, "epoch": 0.9686560965480175, "percentage": 49.56, "elapsed_time": "21:00:36", "remaining_time": "21:22:51", "throughput": 332.03, "total_tokens": 25113440} {"current_steps": 19830, "total_steps": 40000, "loss": 0.0562, "lr": 0.1520144857279709, "epoch": 0.9689003982117118, "percentage": 49.58, "elapsed_time": "21:00:39", "remaining_time": "21:22:16", "throughput": 332.1, "total_tokens": 25119680} {"current_steps": 19835, "total_steps": 40000, "loss": 0.0601, "lr": 0.1519555860242495, "epoch": 0.9691446998754062, "percentage": 49.59, "elapsed_time": "21:00:42", "remaining_time": "21:21:40", "throughput": 332.16, "total_tokens": 25125728} {"current_steps": 19840, "total_steps": 40000, "loss": 0.043, "lr": 0.15189668601895218, "epoch": 0.9693890015391005, "percentage": 49.6, "elapsed_time": "21:00:45", "remaining_time": "21:21:05", "throughput": 332.23, "total_tokens": 25131776} {"current_steps": 19845, "total_steps": 40000, "loss": 0.0667, "lr": 0.151837785721162, "epoch": 0.9696333032027948, "percentage": 49.61, "elapsed_time": "21:00:48", "remaining_time": "21:20:30", "throughput": 332.3, "total_tokens": 25138016} {"current_steps": 19850, "total_steps": 40000, "loss": 0.0654, "lr": 0.15177888513996218, "epoch": 0.9698776048664891, "percentage": 49.62, "elapsed_time": "21:00:51", "remaining_time": "21:19:54", "throughput": 332.37, "total_tokens": 25144128} {"current_steps": 19855, "total_steps": 40000, "loss": 0.0568, "lr": 0.15171998428443592, "epoch": 0.9701219065301835, "percentage": 49.64, "elapsed_time": "21:00:54", "remaining_time": "21:19:19", "throughput": 332.44, "total_tokens": 25150528} {"current_steps": 19860, "total_steps": 40000, "loss": 0.0748, "lr": 0.1516610831636665, "epoch": 0.9703662081938778, "percentage": 49.65, "elapsed_time": "21:00:57", "remaining_time": "21:18:44", "throughput": 332.51, "total_tokens": 25156736} {"current_steps": 19865, "total_steps": 40000, "loss": 0.0627, "lr": 0.15160218178673715, "epoch": 0.9706105098575721, "percentage": 49.66, "elapsed_time": "21:01:00", "remaining_time": "21:18:09", "throughput": 332.58, "total_tokens": 25162848} {"current_steps": 19870, "total_steps": 40000, "loss": 0.062, "lr": 0.15154328016273122, "epoch": 0.9708548115212665, "percentage": 49.68, "elapsed_time": "21:01:03", "remaining_time": "21:17:33", "throughput": 332.64, "total_tokens": 25169120} {"current_steps": 19875, "total_steps": 40000, "loss": 0.0425, "lr": 0.1514843783007321, "epoch": 0.9710991131849608, "percentage": 49.69, "elapsed_time": "21:01:06", "remaining_time": "21:16:58", "throughput": 332.72, "total_tokens": 25175936} {"current_steps": 19880, "total_steps": 40000, "loss": 0.0934, "lr": 0.15142547620982322, "epoch": 0.9713434148486552, "percentage": 49.7, "elapsed_time": "21:01:10", "remaining_time": "21:16:23", "throughput": 332.79, "total_tokens": 25181920} {"current_steps": 19885, "total_steps": 40000, "loss": 0.0745, "lr": 0.15136657389908797, "epoch": 0.9715877165123494, "percentage": 49.71, "elapsed_time": "21:01:12", "remaining_time": "21:15:48", "throughput": 332.85, "total_tokens": 25187872} {"current_steps": 19890, "total_steps": 40000, "loss": 0.0696, "lr": 0.15130767137760986, "epoch": 0.9718320181760438, "percentage": 49.73, "elapsed_time": "21:01:16", "remaining_time": "21:15:13", "throughput": 332.92, "total_tokens": 25194016} {"current_steps": 19895, "total_steps": 40000, "loss": 0.0579, "lr": 0.15124876865447243, "epoch": 0.9720763198397381, "percentage": 49.74, "elapsed_time": "21:01:19", "remaining_time": "21:14:37", "throughput": 332.99, "total_tokens": 25200320} {"current_steps": 19900, "total_steps": 40000, "loss": 0.0462, "lr": 0.15118986573875912, "epoch": 0.9723206215034325, "percentage": 49.75, "elapsed_time": "21:01:22", "remaining_time": "21:14:02", "throughput": 333.06, "total_tokens": 25206944} {"current_steps": 19905, "total_steps": 40000, "loss": 0.0546, "lr": 0.15113096263955358, "epoch": 0.9725649231671267, "percentage": 49.76, "elapsed_time": "21:01:25", "remaining_time": "21:13:27", "throughput": 333.13, "total_tokens": 25212896} {"current_steps": 19910, "total_steps": 40000, "loss": 0.0352, "lr": 0.1510720593659394, "epoch": 0.9728092248308211, "percentage": 49.78, "elapsed_time": "21:01:28", "remaining_time": "21:12:52", "throughput": 333.2, "total_tokens": 25219584} {"current_steps": 19915, "total_steps": 40000, "loss": 0.0634, "lr": 0.15101315592700015, "epoch": 0.9730535264945154, "percentage": 49.79, "elapsed_time": "21:01:31", "remaining_time": "21:12:17", "throughput": 333.28, "total_tokens": 25226144} {"current_steps": 19920, "total_steps": 40000, "loss": 0.0796, "lr": 0.15095425233181956, "epoch": 0.9732978281582098, "percentage": 49.8, "elapsed_time": "21:01:34", "remaining_time": "21:11:42", "throughput": 333.34, "total_tokens": 25232320} {"current_steps": 19925, "total_steps": 40000, "loss": 0.0699, "lr": 0.15089534858948128, "epoch": 0.9735421298219041, "percentage": 49.81, "elapsed_time": "21:01:37", "remaining_time": "21:11:07", "throughput": 333.42, "total_tokens": 25238944} {"current_steps": 19930, "total_steps": 40000, "loss": 0.0574, "lr": 0.15083644470906898, "epoch": 0.9737864314855984, "percentage": 49.83, "elapsed_time": "21:01:40", "remaining_time": "21:10:32", "throughput": 333.49, "total_tokens": 25245376} {"current_steps": 19935, "total_steps": 40000, "loss": 0.0638, "lr": 0.1507775406996664, "epoch": 0.9740307331492928, "percentage": 49.84, "elapsed_time": "21:01:44", "remaining_time": "21:09:57", "throughput": 333.56, "total_tokens": 25251456} {"current_steps": 19940, "total_steps": 40000, "loss": 0.0609, "lr": 0.15071863657035725, "epoch": 0.974275034812987, "percentage": 49.85, "elapsed_time": "21:01:47", "remaining_time": "21:09:22", "throughput": 333.63, "total_tokens": 25258016} {"current_steps": 19945, "total_steps": 40000, "loss": 0.0584, "lr": 0.15065973233022534, "epoch": 0.9745193364766814, "percentage": 49.86, "elapsed_time": "21:01:50", "remaining_time": "21:08:47", "throughput": 333.7, "total_tokens": 25264448} {"current_steps": 19950, "total_steps": 40000, "loss": 0.0652, "lr": 0.15060082798835442, "epoch": 0.9747636381403757, "percentage": 49.88, "elapsed_time": "21:01:53", "remaining_time": "21:08:12", "throughput": 333.77, "total_tokens": 25270688} {"current_steps": 19955, "total_steps": 40000, "loss": 0.0603, "lr": 0.15054192355382823, "epoch": 0.9750079398040701, "percentage": 49.89, "elapsed_time": "21:01:56", "remaining_time": "21:07:37", "throughput": 333.84, "total_tokens": 25277056} {"current_steps": 19960, "total_steps": 40000, "loss": 0.0654, "lr": 0.15048301903573066, "epoch": 0.9752522414677643, "percentage": 49.9, "elapsed_time": "21:01:59", "remaining_time": "21:07:02", "throughput": 333.91, "total_tokens": 25283520} {"current_steps": 19965, "total_steps": 40000, "loss": 0.0539, "lr": 0.15042411444314546, "epoch": 0.9754965431314587, "percentage": 49.91, "elapsed_time": "21:02:02", "remaining_time": "21:06:28", "throughput": 333.98, "total_tokens": 25289664} {"current_steps": 19970, "total_steps": 40000, "loss": 0.0596, "lr": 0.1503652097851565, "epoch": 0.9757408447951531, "percentage": 49.93, "elapsed_time": "21:02:05", "remaining_time": "21:05:53", "throughput": 334.04, "total_tokens": 25295744} {"current_steps": 19975, "total_steps": 40000, "loss": 0.0788, "lr": 0.15030630507084758, "epoch": 0.9759851464588474, "percentage": 49.94, "elapsed_time": "21:02:08", "remaining_time": "21:05:18", "throughput": 334.11, "total_tokens": 25301504} {"current_steps": 19980, "total_steps": 40000, "loss": 0.0797, "lr": 0.1502474003093026, "epoch": 0.9762294481225418, "percentage": 49.95, "elapsed_time": "21:02:11", "remaining_time": "21:04:43", "throughput": 334.18, "total_tokens": 25307776} {"current_steps": 19985, "total_steps": 40000, "loss": 0.0512, "lr": 0.15018849550960536, "epoch": 0.976473749786236, "percentage": 49.96, "elapsed_time": "21:02:14", "remaining_time": "21:04:08", "throughput": 334.25, "total_tokens": 25313984} {"current_steps": 19990, "total_steps": 40000, "loss": 0.0494, "lr": 0.15012959068083975, "epoch": 0.9767180514499304, "percentage": 49.98, "elapsed_time": "21:02:17", "remaining_time": "21:03:33", "throughput": 334.31, "total_tokens": 25320064} {"current_steps": 19995, "total_steps": 40000, "loss": 0.0622, "lr": 0.1500706858320896, "epoch": 0.9769623531136247, "percentage": 49.99, "elapsed_time": "21:02:20", "remaining_time": "21:02:58", "throughput": 334.38, "total_tokens": 25326272} {"current_steps": 20000, "total_steps": 40000, "loss": 0.0332, "lr": 0.15001178097243886, "epoch": 0.977206654777319, "percentage": 50.0, "elapsed_time": "21:02:23", "remaining_time": "21:02:23", "throughput": 334.45, "total_tokens": 25332672} {"current_steps": 20000, "total_steps": 40000, "eval_loss": 0.06547097861766815, "epoch": 0.977206654777319, "percentage": 50.0, "elapsed_time": "21:13:03", "remaining_time": "21:13:03", "throughput": 331.65, "total_tokens": 25332672} {"current_steps": 20005, "total_steps": 40000, "loss": 0.0757, "lr": 0.1499528761109713, "epoch": 0.9774509564410133, "percentage": 50.01, "elapsed_time": "21:13:07", "remaining_time": "21:12:29", "throughput": 331.72, "total_tokens": 25339072} {"current_steps": 20010, "total_steps": 40000, "loss": 0.0615, "lr": 0.14989397125677087, "epoch": 0.9776952581047077, "percentage": 50.02, "elapsed_time": "21:13:10", "remaining_time": "21:11:54", "throughput": 331.78, "total_tokens": 25345056} {"current_steps": 20015, "total_steps": 40000, "loss": 0.0427, "lr": 0.14983506641892141, "epoch": 0.9779395597684021, "percentage": 50.04, "elapsed_time": "21:13:13", "remaining_time": "21:11:19", "throughput": 331.85, "total_tokens": 25351232} {"current_steps": 20020, "total_steps": 40000, "loss": 0.0738, "lr": 0.14977616160650672, "epoch": 0.9781838614320963, "percentage": 50.05, "elapsed_time": "21:13:17", "remaining_time": "21:10:44", "throughput": 331.93, "total_tokens": 25358400} {"current_steps": 20025, "total_steps": 40000, "loss": 0.0452, "lr": 0.14971725682861076, "epoch": 0.9784281630957907, "percentage": 50.06, "elapsed_time": "21:13:20", "remaining_time": "21:10:09", "throughput": 332.0, "total_tokens": 25364800} {"current_steps": 20030, "total_steps": 40000, "loss": 0.0373, "lr": 0.14965835209431738, "epoch": 0.978672464759485, "percentage": 50.08, "elapsed_time": "21:13:23", "remaining_time": "21:09:34", "throughput": 332.06, "total_tokens": 25370848} {"current_steps": 20035, "total_steps": 40000, "loss": 0.052, "lr": 0.14959944741271036, "epoch": 0.9789167664231794, "percentage": 50.09, "elapsed_time": "21:13:26", "remaining_time": "21:08:59", "throughput": 332.13, "total_tokens": 25377216} {"current_steps": 20040, "total_steps": 40000, "loss": 0.0468, "lr": 0.14954054279287363, "epoch": 0.9791610680868736, "percentage": 50.1, "elapsed_time": "21:13:29", "remaining_time": "21:08:24", "throughput": 332.2, "total_tokens": 25383488} {"current_steps": 20045, "total_steps": 40000, "loss": 0.0704, "lr": 0.14948163824389094, "epoch": 0.979405369750568, "percentage": 50.11, "elapsed_time": "21:13:32", "remaining_time": "21:07:49", "throughput": 332.27, "total_tokens": 25389920} {"current_steps": 20050, "total_steps": 40000, "loss": 0.067, "lr": 0.14942273377484613, "epoch": 0.9796496714142623, "percentage": 50.12, "elapsed_time": "21:13:35", "remaining_time": "21:07:14", "throughput": 332.34, "total_tokens": 25396128} {"current_steps": 20055, "total_steps": 40000, "loss": 0.0634, "lr": 0.1493638293948231, "epoch": 0.9798939730779567, "percentage": 50.14, "elapsed_time": "21:13:38", "remaining_time": "21:06:39", "throughput": 332.41, "total_tokens": 25402144} {"current_steps": 20060, "total_steps": 40000, "loss": 0.041, "lr": 0.14930492511290547, "epoch": 0.9801382747416509, "percentage": 50.15, "elapsed_time": "21:13:41", "remaining_time": "21:06:04", "throughput": 332.48, "total_tokens": 25409056} {"current_steps": 20065, "total_steps": 40000, "loss": 0.0632, "lr": 0.14924602093817715, "epoch": 0.9803825764053453, "percentage": 50.16, "elapsed_time": "21:13:45", "remaining_time": "21:05:29", "throughput": 332.56, "total_tokens": 25415712} {"current_steps": 20070, "total_steps": 40000, "loss": 0.0652, "lr": 0.14918711687972194, "epoch": 0.9806268780690397, "percentage": 50.18, "elapsed_time": "21:13:48", "remaining_time": "21:04:55", "throughput": 332.62, "total_tokens": 25421824} {"current_steps": 20075, "total_steps": 40000, "loss": 0.042, "lr": 0.14912821294662346, "epoch": 0.980871179732734, "percentage": 50.19, "elapsed_time": "21:13:51", "remaining_time": "21:04:19", "throughput": 332.68, "total_tokens": 25427424} {"current_steps": 20080, "total_steps": 40000, "loss": 0.0634, "lr": 0.14906930914796554, "epoch": 0.9811154813964283, "percentage": 50.2, "elapsed_time": "21:13:54", "remaining_time": "21:03:45", "throughput": 332.75, "total_tokens": 25433696} {"current_steps": 20085, "total_steps": 40000, "loss": 0.0697, "lr": 0.14901040549283182, "epoch": 0.9813597830601226, "percentage": 50.21, "elapsed_time": "21:13:57", "remaining_time": "21:03:10", "throughput": 332.82, "total_tokens": 25440064} {"current_steps": 20090, "total_steps": 40000, "loss": 0.0762, "lr": 0.148951501990306, "epoch": 0.981604084723817, "percentage": 50.22, "elapsed_time": "21:14:00", "remaining_time": "21:02:35", "throughput": 332.9, "total_tokens": 25446688} {"current_steps": 20095, "total_steps": 40000, "loss": 0.0941, "lr": 0.14889259864947177, "epoch": 0.9818483863875113, "percentage": 50.24, "elapsed_time": "21:14:03", "remaining_time": "21:02:00", "throughput": 332.97, "total_tokens": 25453376} {"current_steps": 20100, "total_steps": 40000, "loss": 0.0632, "lr": 0.14883369547941272, "epoch": 0.9820926880512056, "percentage": 50.25, "elapsed_time": "21:14:06", "remaining_time": "21:01:25", "throughput": 333.03, "total_tokens": 25459200} {"current_steps": 20105, "total_steps": 40000, "loss": 0.0485, "lr": 0.14877479248921247, "epoch": 0.9823369897148999, "percentage": 50.26, "elapsed_time": "21:14:09", "remaining_time": "21:00:50", "throughput": 333.1, "total_tokens": 25465184} {"current_steps": 20110, "total_steps": 40000, "loss": 0.0507, "lr": 0.14871588968795468, "epoch": 0.9825812913785943, "percentage": 50.28, "elapsed_time": "21:14:12", "remaining_time": "21:00:16", "throughput": 333.17, "total_tokens": 25471872} {"current_steps": 20115, "total_steps": 40000, "loss": 0.0377, "lr": 0.1486569870847228, "epoch": 0.9828255930422887, "percentage": 50.29, "elapsed_time": "21:14:15", "remaining_time": "20:59:41", "throughput": 333.24, "total_tokens": 25478240} {"current_steps": 20120, "total_steps": 40000, "loss": 0.0689, "lr": 0.1485980846886004, "epoch": 0.9830698947059829, "percentage": 50.3, "elapsed_time": "21:14:18", "remaining_time": "20:59:06", "throughput": 333.31, "total_tokens": 25484288} {"current_steps": 20125, "total_steps": 40000, "loss": 0.0525, "lr": 0.14853918250867096, "epoch": 0.9833141963696773, "percentage": 50.31, "elapsed_time": "21:14:21", "remaining_time": "20:58:31", "throughput": 333.38, "total_tokens": 25490560} {"current_steps": 20130, "total_steps": 40000, "loss": 0.0571, "lr": 0.1484802805540179, "epoch": 0.9835584980333716, "percentage": 50.32, "elapsed_time": "21:14:24", "remaining_time": "20:57:57", "throughput": 333.44, "total_tokens": 25496352} {"current_steps": 20135, "total_steps": 40000, "loss": 0.0553, "lr": 0.14842137883372472, "epoch": 0.983802799697066, "percentage": 50.34, "elapsed_time": "21:14:27", "remaining_time": "20:57:22", "throughput": 333.5, "total_tokens": 25502080} {"current_steps": 20140, "total_steps": 40000, "loss": 0.0614, "lr": 0.14836247735687474, "epoch": 0.9840471013607602, "percentage": 50.35, "elapsed_time": "21:14:30", "remaining_time": "20:56:47", "throughput": 333.57, "total_tokens": 25508576} {"current_steps": 20145, "total_steps": 40000, "loss": 0.0543, "lr": 0.14830357613255132, "epoch": 0.9842914030244546, "percentage": 50.36, "elapsed_time": "21:14:33", "remaining_time": "20:56:13", "throughput": 333.64, "total_tokens": 25514688} {"current_steps": 20150, "total_steps": 40000, "loss": 0.0604, "lr": 0.1482446751698378, "epoch": 0.9845357046881489, "percentage": 50.38, "elapsed_time": "21:14:37", "remaining_time": "20:55:38", "throughput": 333.71, "total_tokens": 25521152} {"current_steps": 20155, "total_steps": 40000, "loss": 0.0588, "lr": 0.14818577447781744, "epoch": 0.9847800063518433, "percentage": 50.39, "elapsed_time": "21:14:40", "remaining_time": "20:55:03", "throughput": 333.79, "total_tokens": 25528000} {"current_steps": 20160, "total_steps": 40000, "loss": 0.0359, "lr": 0.14812687406557346, "epoch": 0.9850243080155375, "percentage": 50.4, "elapsed_time": "21:14:43", "remaining_time": "20:54:29", "throughput": 333.85, "total_tokens": 25533984} {"current_steps": 20165, "total_steps": 40000, "loss": 0.0745, "lr": 0.14806797394218899, "epoch": 0.9852686096792319, "percentage": 50.41, "elapsed_time": "21:14:46", "remaining_time": "20:53:54", "throughput": 333.92, "total_tokens": 25540576} {"current_steps": 20170, "total_steps": 40000, "loss": 0.0733, "lr": 0.1480090741167472, "epoch": 0.9855129113429263, "percentage": 50.42, "elapsed_time": "21:14:49", "remaining_time": "20:53:20", "throughput": 333.99, "total_tokens": 25546912} {"current_steps": 20175, "total_steps": 40000, "loss": 0.0532, "lr": 0.1479501745983313, "epoch": 0.9857572130066206, "percentage": 50.44, "elapsed_time": "21:14:52", "remaining_time": "20:52:45", "throughput": 334.06, "total_tokens": 25552992} {"current_steps": 20180, "total_steps": 40000, "loss": 0.0535, "lr": 0.14789127539602415, "epoch": 0.9860015146703149, "percentage": 50.45, "elapsed_time": "21:14:55", "remaining_time": "20:52:11", "throughput": 334.13, "total_tokens": 25559680} {"current_steps": 20185, "total_steps": 40000, "loss": 0.0451, "lr": 0.14783237651890885, "epoch": 0.9862458163340092, "percentage": 50.46, "elapsed_time": "21:14:58", "remaining_time": "20:51:36", "throughput": 334.2, "total_tokens": 25566208} {"current_steps": 20190, "total_steps": 40000, "loss": 0.0728, "lr": 0.14777347797606838, "epoch": 0.9864901179977036, "percentage": 50.48, "elapsed_time": "21:15:01", "remaining_time": "20:51:02", "throughput": 334.27, "total_tokens": 25572192} {"current_steps": 20195, "total_steps": 40000, "loss": 0.0465, "lr": 0.14771457977658553, "epoch": 0.9867344196613979, "percentage": 50.49, "elapsed_time": "21:15:04", "remaining_time": "20:50:27", "throughput": 334.33, "total_tokens": 25578048} {"current_steps": 20200, "total_steps": 40000, "loss": 0.0897, "lr": 0.14765568192954326, "epoch": 0.9869787213250922, "percentage": 50.5, "elapsed_time": "21:15:07", "remaining_time": "20:49:52", "throughput": 334.41, "total_tokens": 25584672} {"current_steps": 20200, "total_steps": 40000, "eval_loss": 0.06507953256368637, "epoch": 0.9869787213250922, "percentage": 50.5, "elapsed_time": "21:25:48", "remaining_time": "21:00:20", "throughput": 331.63, "total_tokens": 25584672} {"current_steps": 20205, "total_steps": 40000, "loss": 0.0697, "lr": 0.14759678444402421, "epoch": 0.9872230229887865, "percentage": 50.51, "elapsed_time": "21:25:51", "remaining_time": "20:59:46", "throughput": 331.69, "total_tokens": 25590528} {"current_steps": 20210, "total_steps": 40000, "loss": 0.0603, "lr": 0.14753788732911122, "epoch": 0.9874673246524809, "percentage": 50.52, "elapsed_time": "21:25:54", "remaining_time": "20:59:11", "throughput": 331.76, "total_tokens": 25596544} {"current_steps": 20215, "total_steps": 40000, "loss": 0.0572, "lr": 0.147478990593887, "epoch": 0.9877116263161753, "percentage": 50.54, "elapsed_time": "21:25:58", "remaining_time": "20:58:36", "throughput": 331.83, "total_tokens": 25603168} {"current_steps": 20220, "total_steps": 40000, "loss": 0.0632, "lr": 0.14742009424743405, "epoch": 0.9879559279798695, "percentage": 50.55, "elapsed_time": "21:26:01", "remaining_time": "20:58:01", "throughput": 331.89, "total_tokens": 25609024} {"current_steps": 20225, "total_steps": 40000, "loss": 0.0579, "lr": 0.14736119829883504, "epoch": 0.9882002296435639, "percentage": 50.56, "elapsed_time": "21:26:04", "remaining_time": "20:57:27", "throughput": 331.96, "total_tokens": 25615424} {"current_steps": 20230, "total_steps": 40000, "loss": 0.0824, "lr": 0.14730230275717243, "epoch": 0.9884445313072582, "percentage": 50.58, "elapsed_time": "21:26:07", "remaining_time": "20:56:52", "throughput": 332.02, "total_tokens": 25621280} {"current_steps": 20235, "total_steps": 40000, "loss": 0.0727, "lr": 0.14724340763152854, "epoch": 0.9886888329709526, "percentage": 50.59, "elapsed_time": "21:26:10", "remaining_time": "20:56:17", "throughput": 332.09, "total_tokens": 25627072} {"current_steps": 20240, "total_steps": 40000, "loss": 0.0727, "lr": 0.14718451293098594, "epoch": 0.9889331346346468, "percentage": 50.6, "elapsed_time": "21:26:13", "remaining_time": "20:55:42", "throughput": 332.15, "total_tokens": 25632928} {"current_steps": 20245, "total_steps": 40000, "loss": 0.0723, "lr": 0.14712561866462676, "epoch": 0.9891774362983412, "percentage": 50.61, "elapsed_time": "21:26:16", "remaining_time": "20:55:08", "throughput": 332.22, "total_tokens": 25639584} {"current_steps": 20250, "total_steps": 40000, "loss": 0.0446, "lr": 0.1470667248415333, "epoch": 0.9894217379620355, "percentage": 50.62, "elapsed_time": "21:26:19", "remaining_time": "20:54:33", "throughput": 332.29, "total_tokens": 25645824} {"current_steps": 20255, "total_steps": 40000, "loss": 0.0641, "lr": 0.1470078314707878, "epoch": 0.9896660396257299, "percentage": 50.64, "elapsed_time": "21:26:22", "remaining_time": "20:53:58", "throughput": 332.35, "total_tokens": 25651904} {"current_steps": 20260, "total_steps": 40000, "loss": 0.0659, "lr": 0.14694893856147223, "epoch": 0.9899103412894242, "percentage": 50.65, "elapsed_time": "21:26:25", "remaining_time": "20:53:24", "throughput": 332.43, "total_tokens": 25658624} {"current_steps": 20265, "total_steps": 40000, "loss": 0.0468, "lr": 0.14689004612266868, "epoch": 0.9901546429531185, "percentage": 50.66, "elapsed_time": "21:26:28", "remaining_time": "20:52:49", "throughput": 332.5, "total_tokens": 25665120} {"current_steps": 20270, "total_steps": 40000, "loss": 0.0768, "lr": 0.14683115416345913, "epoch": 0.9903989446168129, "percentage": 50.68, "elapsed_time": "21:26:31", "remaining_time": "20:52:15", "throughput": 332.57, "total_tokens": 25671520} {"current_steps": 20275, "total_steps": 40000, "loss": 0.0779, "lr": 0.1467722626929254, "epoch": 0.9906432462805072, "percentage": 50.69, "elapsed_time": "21:26:34", "remaining_time": "20:51:40", "throughput": 332.63, "total_tokens": 25677536} {"current_steps": 20280, "total_steps": 40000, "loss": 0.0529, "lr": 0.14671337172014937, "epoch": 0.9908875479442015, "percentage": 50.7, "elapsed_time": "21:26:37", "remaining_time": "20:51:05", "throughput": 332.69, "total_tokens": 25683232} {"current_steps": 20285, "total_steps": 40000, "loss": 0.0564, "lr": 0.14665448125421265, "epoch": 0.9911318496078958, "percentage": 50.71, "elapsed_time": "21:26:40", "remaining_time": "20:50:31", "throughput": 332.76, "total_tokens": 25689056} {"current_steps": 20290, "total_steps": 40000, "loss": 0.0511, "lr": 0.146595591304197, "epoch": 0.9913761512715902, "percentage": 50.72, "elapsed_time": "21:26:43", "remaining_time": "20:49:56", "throughput": 332.82, "total_tokens": 25695200} {"current_steps": 20295, "total_steps": 40000, "loss": 0.0643, "lr": 0.14653670187918397, "epoch": 0.9916204529352844, "percentage": 50.74, "elapsed_time": "21:26:46", "remaining_time": "20:49:22", "throughput": 332.89, "total_tokens": 25701184} {"current_steps": 20300, "total_steps": 40000, "loss": 0.0702, "lr": 0.14647781298825502, "epoch": 0.9918647545989788, "percentage": 50.75, "elapsed_time": "21:26:49", "remaining_time": "20:48:47", "throughput": 332.95, "total_tokens": 25706912} {"current_steps": 20305, "total_steps": 40000, "loss": 0.0619, "lr": 0.14641892464049153, "epoch": 0.9921090562626731, "percentage": 50.76, "elapsed_time": "21:26:52", "remaining_time": "20:48:13", "throughput": 333.02, "total_tokens": 25713024} {"current_steps": 20310, "total_steps": 40000, "loss": 0.0664, "lr": 0.14636003684497495, "epoch": 0.9923533579263675, "percentage": 50.78, "elapsed_time": "21:26:55", "remaining_time": "20:47:38", "throughput": 333.08, "total_tokens": 25719456} {"current_steps": 20315, "total_steps": 40000, "loss": 0.0508, "lr": 0.14630114961078636, "epoch": 0.9925976595900619, "percentage": 50.79, "elapsed_time": "21:26:58", "remaining_time": "20:47:04", "throughput": 333.15, "total_tokens": 25725600} {"current_steps": 20320, "total_steps": 40000, "loss": 0.0742, "lr": 0.14624226294700704, "epoch": 0.9928419612537561, "percentage": 50.8, "elapsed_time": "21:27:02", "remaining_time": "20:46:29", "throughput": 333.22, "total_tokens": 25732160} {"current_steps": 20325, "total_steps": 40000, "loss": 0.0453, "lr": 0.14618337686271793, "epoch": 0.9930862629174505, "percentage": 50.81, "elapsed_time": "21:27:05", "remaining_time": "20:45:55", "throughput": 333.29, "total_tokens": 25738496} {"current_steps": 20330, "total_steps": 40000, "loss": 0.0426, "lr": 0.1461244913670001, "epoch": 0.9933305645811448, "percentage": 50.82, "elapsed_time": "21:27:08", "remaining_time": "20:45:21", "throughput": 333.36, "total_tokens": 25745056} {"current_steps": 20335, "total_steps": 40000, "loss": 0.0487, "lr": 0.1460656064689344, "epoch": 0.9935748662448391, "percentage": 50.84, "elapsed_time": "21:27:11", "remaining_time": "20:44:46", "throughput": 333.43, "total_tokens": 25751328} {"current_steps": 20340, "total_steps": 40000, "loss": 0.044, "lr": 0.14600672217760163, "epoch": 0.9938191679085334, "percentage": 50.85, "elapsed_time": "21:27:14", "remaining_time": "20:44:12", "throughput": 333.5, "total_tokens": 25757504} {"current_steps": 20345, "total_steps": 40000, "loss": 0.0646, "lr": 0.14594783850208248, "epoch": 0.9940634695722278, "percentage": 50.86, "elapsed_time": "21:27:17", "remaining_time": "20:43:38", "throughput": 333.58, "total_tokens": 25765216} {"current_steps": 20350, "total_steps": 40000, "loss": 0.0602, "lr": 0.14588895545145758, "epoch": 0.9943077712359221, "percentage": 50.88, "elapsed_time": "21:27:20", "remaining_time": "20:43:04", "throughput": 333.65, "total_tokens": 25771648} {"current_steps": 20355, "total_steps": 40000, "loss": 0.0871, "lr": 0.14583007303480738, "epoch": 0.9945520728996164, "percentage": 50.89, "elapsed_time": "21:27:24", "remaining_time": "20:42:29", "throughput": 333.72, "total_tokens": 25777984} {"current_steps": 20360, "total_steps": 40000, "loss": 0.0535, "lr": 0.14577119126121235, "epoch": 0.9947963745633108, "percentage": 50.9, "elapsed_time": "21:27:27", "remaining_time": "20:41:55", "throughput": 333.79, "total_tokens": 25784320} {"current_steps": 20365, "total_steps": 40000, "loss": 0.0733, "lr": 0.14571231013975272, "epoch": 0.9950406762270051, "percentage": 50.91, "elapsed_time": "21:27:30", "remaining_time": "20:41:21", "throughput": 333.87, "total_tokens": 25791168} {"current_steps": 20370, "total_steps": 40000, "loss": 0.0625, "lr": 0.1456534296795088, "epoch": 0.9952849778906995, "percentage": 50.92, "elapsed_time": "21:27:33", "remaining_time": "20:40:46", "throughput": 333.94, "total_tokens": 25797888} {"current_steps": 20375, "total_steps": 40000, "loss": 0.0536, "lr": 0.14559454988956066, "epoch": 0.9955292795543937, "percentage": 50.94, "elapsed_time": "21:27:36", "remaining_time": "20:40:12", "throughput": 334.0, "total_tokens": 25803488} {"current_steps": 20380, "total_steps": 40000, "loss": 0.0543, "lr": 0.1455356707789882, "epoch": 0.9957735812180881, "percentage": 50.95, "elapsed_time": "21:27:39", "remaining_time": "20:39:38", "throughput": 334.06, "total_tokens": 25809280} {"current_steps": 20385, "total_steps": 40000, "loss": 0.0789, "lr": 0.14547679235687147, "epoch": 0.9960178828817824, "percentage": 50.96, "elapsed_time": "21:27:42", "remaining_time": "20:39:03", "throughput": 334.12, "total_tokens": 25815104} {"current_steps": 20390, "total_steps": 40000, "loss": 0.0957, "lr": 0.14541791463229023, "epoch": 0.9962621845454768, "percentage": 50.98, "elapsed_time": "21:27:45", "remaining_time": "20:38:29", "throughput": 334.19, "total_tokens": 25821440} {"current_steps": 20395, "total_steps": 40000, "loss": 0.0594, "lr": 0.14535903761432406, "epoch": 0.996506486209171, "percentage": 50.99, "elapsed_time": "21:27:48", "remaining_time": "20:37:55", "throughput": 334.27, "total_tokens": 25828320} {"current_steps": 20400, "total_steps": 40000, "loss": 0.0617, "lr": 0.1453001613120527, "epoch": 0.9967507878728654, "percentage": 51.0, "elapsed_time": "21:27:51", "remaining_time": "20:37:21", "throughput": 334.33, "total_tokens": 25834336} {"current_steps": 20400, "total_steps": 40000, "eval_loss": 0.06505754590034485, "epoch": 0.9967507878728654, "percentage": 51.0, "elapsed_time": "21:38:31", "remaining_time": "20:47:36", "throughput": 331.58, "total_tokens": 25834336} {"current_steps": 20405, "total_steps": 40000, "loss": 0.0498, "lr": 0.14524128573455547, "epoch": 0.9969950895365598, "percentage": 51.01, "elapsed_time": "21:38:35", "remaining_time": "20:47:02", "throughput": 331.65, "total_tokens": 25840736} {"current_steps": 20410, "total_steps": 40000, "loss": 0.0511, "lr": 0.14518241089091177, "epoch": 0.9972393912002541, "percentage": 51.02, "elapsed_time": "21:38:38", "remaining_time": "20:46:28", "throughput": 331.72, "total_tokens": 25846944} {"current_steps": 20415, "total_steps": 40000, "loss": 0.0792, "lr": 0.1451235367902009, "epoch": 0.9974836928639484, "percentage": 51.04, "elapsed_time": "21:38:42", "remaining_time": "20:45:53", "throughput": 331.78, "total_tokens": 25853184} {"current_steps": 20420, "total_steps": 40000, "loss": 0.0745, "lr": 0.1450646634415019, "epoch": 0.9977279945276427, "percentage": 51.05, "elapsed_time": "21:38:45", "remaining_time": "20:45:19", "throughput": 331.85, "total_tokens": 25859680} {"current_steps": 20425, "total_steps": 40000, "loss": 0.063, "lr": 0.1450057908538938, "epoch": 0.9979722961913371, "percentage": 51.06, "elapsed_time": "21:38:48", "remaining_time": "20:44:45", "throughput": 331.92, "total_tokens": 25865600} {"current_steps": 20430, "total_steps": 40000, "loss": 0.0941, "lr": 0.14494691903645557, "epoch": 0.9982165978550314, "percentage": 51.08, "elapsed_time": "21:38:51", "remaining_time": "20:44:10", "throughput": 331.98, "total_tokens": 25871392} {"current_steps": 20435, "total_steps": 40000, "loss": 0.0714, "lr": 0.14488804799826588, "epoch": 0.9984608995187257, "percentage": 51.09, "elapsed_time": "21:38:54", "remaining_time": "20:43:36", "throughput": 332.05, "total_tokens": 25878016} {"current_steps": 20440, "total_steps": 40000, "loss": 0.0553, "lr": 0.14482917774840348, "epoch": 0.99870520118242, "percentage": 51.1, "elapsed_time": "21:38:57", "remaining_time": "20:43:02", "throughput": 332.12, "total_tokens": 25884832} {"current_steps": 20445, "total_steps": 40000, "loss": 0.0497, "lr": 0.14477030829594684, "epoch": 0.9989495028461144, "percentage": 51.11, "elapsed_time": "21:39:00", "remaining_time": "20:42:27", "throughput": 332.19, "total_tokens": 25891104} {"current_steps": 20450, "total_steps": 40000, "loss": 0.0581, "lr": 0.14471143964997432, "epoch": 0.9991938045098087, "percentage": 51.12, "elapsed_time": "21:39:03", "remaining_time": "20:41:53", "throughput": 332.26, "total_tokens": 25897280} {"current_steps": 20455, "total_steps": 40000, "loss": 0.0361, "lr": 0.14465257181956434, "epoch": 0.999438106173503, "percentage": 51.14, "elapsed_time": "21:39:06", "remaining_time": "20:41:19", "throughput": 332.33, "total_tokens": 25903744} {"current_steps": 20460, "total_steps": 40000, "loss": 0.0669, "lr": 0.1445937048137949, "epoch": 0.9996824078371974, "percentage": 51.15, "elapsed_time": "21:39:09", "remaining_time": "20:40:44", "throughput": 332.39, "total_tokens": 25909824} {"current_steps": 20465, "total_steps": 40000, "loss": 0.0224, "lr": 0.14453483864174416, "epoch": 0.9999267095008917, "percentage": 51.16, "elapsed_time": "21:39:12", "remaining_time": "20:40:10", "throughput": 332.46, "total_tokens": 25916416} {"current_steps": 20470, "total_steps": 40000, "loss": 0.0613, "lr": 0.14447597331249, "epoch": 1.0001954413309555, "percentage": 51.18, "elapsed_time": "21:39:16", "remaining_time": "20:39:36", "throughput": 332.53, "total_tokens": 25922848} {"current_steps": 20475, "total_steps": 40000, "loss": 0.0773, "lr": 0.1444171088351102, "epoch": 1.0004397429946499, "percentage": 51.19, "elapsed_time": "21:39:19", "remaining_time": "20:39:02", "throughput": 332.6, "total_tokens": 25929280} {"current_steps": 20480, "total_steps": 40000, "loss": 0.0457, "lr": 0.14435824521868235, "epoch": 1.000684044658344, "percentage": 51.2, "elapsed_time": "21:39:22", "remaining_time": "20:38:28", "throughput": 332.67, "total_tokens": 25936000} {"current_steps": 20485, "total_steps": 40000, "loss": 0.1044, "lr": 0.14429938247228397, "epoch": 1.0009283463220384, "percentage": 51.21, "elapsed_time": "21:39:25", "remaining_time": "20:37:53", "throughput": 332.74, "total_tokens": 25941920} {"current_steps": 20490, "total_steps": 40000, "loss": 0.0933, "lr": 0.14424052060499243, "epoch": 1.0011726479857328, "percentage": 51.23, "elapsed_time": "21:39:29", "remaining_time": "20:37:20", "throughput": 332.82, "total_tokens": 25949888} {"current_steps": 20495, "total_steps": 40000, "loss": 0.0644, "lr": 0.14418165962588506, "epoch": 1.0014169496494272, "percentage": 51.24, "elapsed_time": "21:39:32", "remaining_time": "20:36:45", "throughput": 332.89, "total_tokens": 25956064} {"current_steps": 20500, "total_steps": 40000, "loss": 0.0661, "lr": 0.1441227995440388, "epoch": 1.0016612513131213, "percentage": 51.25, "elapsed_time": "21:39:35", "remaining_time": "20:36:11", "throughput": 332.95, "total_tokens": 25962240} {"current_steps": 20505, "total_steps": 40000, "loss": 0.0834, "lr": 0.14406394036853082, "epoch": 1.0019055529768157, "percentage": 51.26, "elapsed_time": "21:39:38", "remaining_time": "20:35:37", "throughput": 333.02, "total_tokens": 25968512} {"current_steps": 20510, "total_steps": 40000, "loss": 0.0899, "lr": 0.14400508210843774, "epoch": 1.00214985464051, "percentage": 51.28, "elapsed_time": "21:39:41", "remaining_time": "20:35:03", "throughput": 333.1, "total_tokens": 25975456} {"current_steps": 20515, "total_steps": 40000, "loss": 0.0563, "lr": 0.1439462247728364, "epoch": 1.0023941563042045, "percentage": 51.29, "elapsed_time": "21:39:44", "remaining_time": "20:34:29", "throughput": 333.17, "total_tokens": 25981984} {"current_steps": 20520, "total_steps": 40000, "loss": 0.046, "lr": 0.14388736837080326, "epoch": 1.0026384579678989, "percentage": 51.3, "elapsed_time": "21:39:47", "remaining_time": "20:33:55", "throughput": 333.24, "total_tokens": 25988256} {"current_steps": 20525, "total_steps": 40000, "loss": 0.079, "lr": 0.14382851291141469, "epoch": 1.002882759631593, "percentage": 51.31, "elapsed_time": "21:39:50", "remaining_time": "20:33:20", "throughput": 333.31, "total_tokens": 25994752} {"current_steps": 20530, "total_steps": 40000, "loss": 0.0661, "lr": 0.14376965840374697, "epoch": 1.0031270612952874, "percentage": 51.32, "elapsed_time": "21:39:53", "remaining_time": "20:32:46", "throughput": 333.38, "total_tokens": 26001504} {"current_steps": 20535, "total_steps": 40000, "loss": 0.0496, "lr": 0.14371080485687632, "epoch": 1.0033713629589818, "percentage": 51.34, "elapsed_time": "21:39:57", "remaining_time": "20:32:12", "throughput": 333.45, "total_tokens": 26007968} {"current_steps": 20540, "total_steps": 40000, "loss": 0.07, "lr": 0.1436519522798785, "epoch": 1.0036156646226762, "percentage": 51.35, "elapsed_time": "21:40:00", "remaining_time": "20:31:38", "throughput": 333.51, "total_tokens": 26014080} {"current_steps": 20545, "total_steps": 40000, "loss": 0.0427, "lr": 0.14359310068182948, "epoch": 1.0038599662863703, "percentage": 51.36, "elapsed_time": "21:40:03", "remaining_time": "20:31:04", "throughput": 333.59, "total_tokens": 26020832} {"current_steps": 20550, "total_steps": 40000, "loss": 0.0868, "lr": 0.14353425007180484, "epoch": 1.0041042679500647, "percentage": 51.38, "elapsed_time": "21:40:06", "remaining_time": "20:30:30", "throughput": 333.66, "total_tokens": 26027552} {"current_steps": 20555, "total_steps": 40000, "loss": 0.0521, "lr": 0.14347540045888005, "epoch": 1.004348569613759, "percentage": 51.39, "elapsed_time": "21:40:09", "remaining_time": "20:29:56", "throughput": 333.72, "total_tokens": 26033664} {"current_steps": 20560, "total_steps": 40000, "loss": 0.0578, "lr": 0.14341655185213056, "epoch": 1.0045928712774534, "percentage": 51.4, "elapsed_time": "21:40:12", "remaining_time": "20:29:22", "throughput": 333.79, "total_tokens": 26040000} {"current_steps": 20565, "total_steps": 40000, "loss": 0.0476, "lr": 0.14335770426063144, "epoch": 1.0048371729411478, "percentage": 51.41, "elapsed_time": "21:40:15", "remaining_time": "20:28:48", "throughput": 333.86, "total_tokens": 26045984} {"current_steps": 20570, "total_steps": 40000, "loss": 0.0472, "lr": 0.1432988576934578, "epoch": 1.005081474604842, "percentage": 51.42, "elapsed_time": "21:40:18", "remaining_time": "20:28:14", "throughput": 333.92, "total_tokens": 26052000} {"current_steps": 20575, "total_steps": 40000, "loss": 0.0404, "lr": 0.14324001215968457, "epoch": 1.0053257762685364, "percentage": 51.44, "elapsed_time": "21:40:21", "remaining_time": "20:27:40", "throughput": 333.99, "total_tokens": 26058528} {"current_steps": 20580, "total_steps": 40000, "loss": 0.0613, "lr": 0.14318116766838637, "epoch": 1.0055700779322307, "percentage": 51.45, "elapsed_time": "21:40:24", "remaining_time": "20:27:06", "throughput": 334.06, "total_tokens": 26065216} {"current_steps": 20585, "total_steps": 40000, "loss": 0.0532, "lr": 0.14312232422863788, "epoch": 1.0058143795959251, "percentage": 51.46, "elapsed_time": "21:40:27", "remaining_time": "20:26:33", "throughput": 334.13, "total_tokens": 26071520} {"current_steps": 20590, "total_steps": 40000, "loss": 0.0507, "lr": 0.14306348184951334, "epoch": 1.0060586812596193, "percentage": 51.48, "elapsed_time": "21:40:31", "remaining_time": "20:25:59", "throughput": 334.2, "total_tokens": 26077952} {"current_steps": 20595, "total_steps": 40000, "loss": 0.0462, "lr": 0.1430046405400871, "epoch": 1.0063029829233137, "percentage": 51.49, "elapsed_time": "21:40:34", "remaining_time": "20:25:25", "throughput": 334.27, "total_tokens": 26084128} {"current_steps": 20600, "total_steps": 40000, "loss": 0.064, "lr": 0.14294580030943324, "epoch": 1.006547284587008, "percentage": 51.5, "elapsed_time": "21:40:37", "remaining_time": "20:24:51", "throughput": 334.33, "total_tokens": 26090080} {"current_steps": 20600, "total_steps": 40000, "eval_loss": 0.0667826235294342, "epoch": 1.006547284587008, "percentage": 51.5, "elapsed_time": "21:51:17", "remaining_time": "20:34:54", "throughput": 331.61, "total_tokens": 26090080} {"current_steps": 20605, "total_steps": 40000, "loss": 0.0487, "lr": 0.14288696116662553, "epoch": 1.0067915862507024, "percentage": 51.51, "elapsed_time": "21:51:24", "remaining_time": "20:34:23", "throughput": 331.66, "total_tokens": 26096384} {"current_steps": 20610, "total_steps": 40000, "loss": 0.0496, "lr": 0.1428281231207378, "epoch": 1.0070358879143968, "percentage": 51.52, "elapsed_time": "21:51:27", "remaining_time": "20:33:49", "throughput": 331.72, "total_tokens": 26102560} {"current_steps": 20615, "total_steps": 40000, "loss": 0.0599, "lr": 0.1427692861808437, "epoch": 1.007280189578091, "percentage": 51.54, "elapsed_time": "21:51:30", "remaining_time": "20:33:15", "throughput": 331.79, "total_tokens": 26109056} {"current_steps": 20620, "total_steps": 40000, "loss": 0.0473, "lr": 0.1427104503560165, "epoch": 1.0075244912417853, "percentage": 51.55, "elapsed_time": "21:51:33", "remaining_time": "20:32:41", "throughput": 331.86, "total_tokens": 26115104} {"current_steps": 20625, "total_steps": 40000, "loss": 0.0665, "lr": 0.14265161565532947, "epoch": 1.0077687929054797, "percentage": 51.56, "elapsed_time": "21:51:36", "remaining_time": "20:32:07", "throughput": 331.92, "total_tokens": 26121248} {"current_steps": 20630, "total_steps": 40000, "loss": 0.0298, "lr": 0.14259278208785564, "epoch": 1.008013094569174, "percentage": 51.58, "elapsed_time": "21:51:40", "remaining_time": "20:31:33", "throughput": 332.0, "total_tokens": 26128032} {"current_steps": 20635, "total_steps": 40000, "loss": 0.067, "lr": 0.14253394966266789, "epoch": 1.0082573962328683, "percentage": 51.59, "elapsed_time": "21:51:43", "remaining_time": "20:30:59", "throughput": 332.06, "total_tokens": 26134176} {"current_steps": 20640, "total_steps": 40000, "loss": 0.0826, "lr": 0.14247511838883894, "epoch": 1.0085016978965626, "percentage": 51.6, "elapsed_time": "21:51:46", "remaining_time": "20:30:25", "throughput": 332.13, "total_tokens": 26140416} {"current_steps": 20645, "total_steps": 40000, "loss": 0.1135, "lr": 0.14241628827544126, "epoch": 1.008745999560257, "percentage": 51.61, "elapsed_time": "21:51:49", "remaining_time": "20:29:51", "throughput": 332.19, "total_tokens": 26146304} {"current_steps": 20650, "total_steps": 40000, "loss": 0.0707, "lr": 0.14235745933154723, "epoch": 1.0089903012239514, "percentage": 51.62, "elapsed_time": "21:51:52", "remaining_time": "20:29:16", "throughput": 332.25, "total_tokens": 26152448} {"current_steps": 20655, "total_steps": 40000, "loss": 0.0544, "lr": 0.14229863156622907, "epoch": 1.0092346028876458, "percentage": 51.64, "elapsed_time": "21:51:55", "remaining_time": "20:28:42", "throughput": 332.32, "total_tokens": 26158976} {"current_steps": 20660, "total_steps": 40000, "loss": 0.0583, "lr": 0.14223980498855868, "epoch": 1.00947890455134, "percentage": 51.65, "elapsed_time": "21:51:58", "remaining_time": "20:28:09", "throughput": 332.39, "total_tokens": 26165184} {"current_steps": 20665, "total_steps": 40000, "loss": 0.0539, "lr": 0.14218097960760792, "epoch": 1.0097232062150343, "percentage": 51.66, "elapsed_time": "21:52:01", "remaining_time": "20:27:34", "throughput": 332.45, "total_tokens": 26171072} {"current_steps": 20670, "total_steps": 40000, "loss": 0.058, "lr": 0.1421221554324483, "epoch": 1.0099675078787287, "percentage": 51.68, "elapsed_time": "21:52:04", "remaining_time": "20:27:00", "throughput": 332.52, "total_tokens": 26177472} {"current_steps": 20675, "total_steps": 40000, "loss": 0.059, "lr": 0.1420633324721513, "epoch": 1.010211809542423, "percentage": 51.69, "elapsed_time": "21:52:07", "remaining_time": "20:26:27", "throughput": 332.59, "total_tokens": 26184384} {"current_steps": 20680, "total_steps": 40000, "loss": 0.0946, "lr": 0.14200451073578824, "epoch": 1.0104561112061172, "percentage": 51.7, "elapsed_time": "21:52:10", "remaining_time": "20:25:53", "throughput": 332.66, "total_tokens": 26190720} {"current_steps": 20685, "total_steps": 40000, "loss": 0.0582, "lr": 0.14194569023243003, "epoch": 1.0107004128698116, "percentage": 51.71, "elapsed_time": "21:52:13", "remaining_time": "20:25:19", "throughput": 332.73, "total_tokens": 26196960} {"current_steps": 20690, "total_steps": 40000, "loss": 0.083, "lr": 0.14188687097114766, "epoch": 1.010944714533506, "percentage": 51.73, "elapsed_time": "21:52:17", "remaining_time": "20:24:45", "throughput": 332.8, "total_tokens": 26203584} {"current_steps": 20695, "total_steps": 40000, "loss": 0.0769, "lr": 0.14182805296101172, "epoch": 1.0111890161972004, "percentage": 51.74, "elapsed_time": "21:52:20", "remaining_time": "20:24:11", "throughput": 332.86, "total_tokens": 26209824} {"current_steps": 20700, "total_steps": 40000, "loss": 0.0633, "lr": 0.14176923621109272, "epoch": 1.0114333178608947, "percentage": 51.75, "elapsed_time": "21:52:23", "remaining_time": "20:23:37", "throughput": 332.93, "total_tokens": 26216256} {"current_steps": 20705, "total_steps": 40000, "loss": 0.0684, "lr": 0.14171042073046097, "epoch": 1.011677619524589, "percentage": 51.76, "elapsed_time": "21:52:26", "remaining_time": "20:23:03", "throughput": 333.0, "total_tokens": 26222336} {"current_steps": 20710, "total_steps": 40000, "loss": 0.0437, "lr": 0.14165160652818642, "epoch": 1.0119219211882833, "percentage": 51.78, "elapsed_time": "21:52:29", "remaining_time": "20:22:29", "throughput": 333.07, "total_tokens": 26228672} {"current_steps": 20715, "total_steps": 40000, "loss": 0.0481, "lr": 0.14159279361333907, "epoch": 1.0121662228519777, "percentage": 51.79, "elapsed_time": "21:52:32", "remaining_time": "20:21:55", "throughput": 333.13, "total_tokens": 26234752} {"current_steps": 20720, "total_steps": 40000, "loss": 0.0744, "lr": 0.14153398199498868, "epoch": 1.012410524515672, "percentage": 51.8, "elapsed_time": "21:52:35", "remaining_time": "20:21:22", "throughput": 333.21, "total_tokens": 26241952} {"current_steps": 20725, "total_steps": 40000, "loss": 0.0573, "lr": 0.14147517168220458, "epoch": 1.0126548261793662, "percentage": 51.81, "elapsed_time": "21:52:38", "remaining_time": "20:20:48", "throughput": 333.28, "total_tokens": 26248480} {"current_steps": 20730, "total_steps": 40000, "loss": 0.0894, "lr": 0.14141636268405616, "epoch": 1.0128991278430606, "percentage": 51.82, "elapsed_time": "21:52:41", "remaining_time": "20:20:14", "throughput": 333.34, "total_tokens": 26254496} {"current_steps": 20735, "total_steps": 40000, "loss": 0.0431, "lr": 0.14135755500961253, "epoch": 1.013143429506755, "percentage": 51.84, "elapsed_time": "21:52:44", "remaining_time": "20:19:40", "throughput": 333.41, "total_tokens": 26260960} {"current_steps": 20740, "total_steps": 40000, "loss": 0.0662, "lr": 0.14129874866794245, "epoch": 1.0133877311704493, "percentage": 51.85, "elapsed_time": "21:52:48", "remaining_time": "20:19:07", "throughput": 333.48, "total_tokens": 26267296} {"current_steps": 20745, "total_steps": 40000, "loss": 0.0537, "lr": 0.14123994366811476, "epoch": 1.0136320328341435, "percentage": 51.86, "elapsed_time": "21:52:51", "remaining_time": "20:18:33", "throughput": 333.54, "total_tokens": 26273696} {"current_steps": 20750, "total_steps": 40000, "loss": 0.0395, "lr": 0.14118114001919774, "epoch": 1.0138763344978379, "percentage": 51.88, "elapsed_time": "21:52:54", "remaining_time": "20:17:59", "throughput": 333.62, "total_tokens": 26280736} {"current_steps": 20755, "total_steps": 40000, "loss": 0.0593, "lr": 0.14112233773025978, "epoch": 1.0141206361615323, "percentage": 51.89, "elapsed_time": "21:52:57", "remaining_time": "20:17:26", "throughput": 333.69, "total_tokens": 26287424} {"current_steps": 20760, "total_steps": 40000, "loss": 0.0492, "lr": 0.14106353681036896, "epoch": 1.0143649378252266, "percentage": 51.9, "elapsed_time": "21:53:00", "remaining_time": "20:16:52", "throughput": 333.76, "total_tokens": 26293632} {"current_steps": 20765, "total_steps": 40000, "loss": 0.0928, "lr": 0.14100473726859303, "epoch": 1.014609239488921, "percentage": 51.91, "elapsed_time": "21:53:03", "remaining_time": "20:16:18", "throughput": 333.82, "total_tokens": 26299904} {"current_steps": 20770, "total_steps": 40000, "loss": 0.0651, "lr": 0.14094593911399964, "epoch": 1.0148535411526152, "percentage": 51.92, "elapsed_time": "21:53:06", "remaining_time": "20:15:45", "throughput": 333.88, "total_tokens": 26305696} {"current_steps": 20775, "total_steps": 40000, "loss": 0.0541, "lr": 0.14088714235565625, "epoch": 1.0150978428163095, "percentage": 51.94, "elapsed_time": "21:53:09", "remaining_time": "20:15:11", "throughput": 333.95, "total_tokens": 26311808} {"current_steps": 20780, "total_steps": 40000, "loss": 0.0413, "lr": 0.14082834700263, "epoch": 1.015342144480004, "percentage": 51.95, "elapsed_time": "21:53:12", "remaining_time": "20:14:37", "throughput": 334.02, "total_tokens": 26318176} {"current_steps": 20785, "total_steps": 40000, "loss": 0.0529, "lr": 0.14076955306398795, "epoch": 1.0155864461436983, "percentage": 51.96, "elapsed_time": "21:53:15", "remaining_time": "20:14:03", "throughput": 334.08, "total_tokens": 26324384} {"current_steps": 20790, "total_steps": 40000, "loss": 0.0702, "lr": 0.14071076054879675, "epoch": 1.0158307478073925, "percentage": 51.98, "elapsed_time": "21:53:18", "remaining_time": "20:13:30", "throughput": 334.15, "total_tokens": 26330496} {"current_steps": 20795, "total_steps": 40000, "loss": 0.0623, "lr": 0.14065196946612302, "epoch": 1.0160750494710868, "percentage": 51.99, "elapsed_time": "21:53:21", "remaining_time": "20:12:56", "throughput": 334.21, "total_tokens": 26336768} {"current_steps": 20800, "total_steps": 40000, "loss": 0.0855, "lr": 0.1405931798250331, "epoch": 1.0163193511347812, "percentage": 52.0, "elapsed_time": "21:53:25", "remaining_time": "20:12:23", "throughput": 334.28, "total_tokens": 26343008} {"current_steps": 20800, "total_steps": 40000, "eval_loss": 0.06624678522348404, "epoch": 1.0163193511347812, "percentage": 52.0, "elapsed_time": "22:04:04", "remaining_time": "20:22:13", "throughput": 331.59, "total_tokens": 26343008} {"current_steps": 20805, "total_steps": 40000, "loss": 0.0758, "lr": 0.14053439163459308, "epoch": 1.0165636527984756, "percentage": 52.01, "elapsed_time": "22:04:08", "remaining_time": "20:21:40", "throughput": 331.66, "total_tokens": 26350112} {"current_steps": 20810, "total_steps": 40000, "loss": 0.0722, "lr": 0.14047560490386876, "epoch": 1.01680795446217, "percentage": 52.02, "elapsed_time": "22:04:11", "remaining_time": "20:21:06", "throughput": 331.73, "total_tokens": 26356672} {"current_steps": 20815, "total_steps": 40000, "loss": 0.0581, "lr": 0.14041681964192593, "epoch": 1.0170522561258641, "percentage": 52.04, "elapsed_time": "22:04:15", "remaining_time": "20:20:33", "throughput": 331.81, "total_tokens": 26363872} {"current_steps": 20820, "total_steps": 40000, "loss": 0.0445, "lr": 0.14035803585782988, "epoch": 1.0172965577895585, "percentage": 52.05, "elapsed_time": "22:04:18", "remaining_time": "20:19:59", "throughput": 331.88, "total_tokens": 26370528} {"current_steps": 20825, "total_steps": 40000, "loss": 0.0482, "lr": 0.14029925356064593, "epoch": 1.017540859453253, "percentage": 52.06, "elapsed_time": "22:04:21", "remaining_time": "20:19:25", "throughput": 331.95, "total_tokens": 26377088} {"current_steps": 20830, "total_steps": 40000, "loss": 0.0469, "lr": 0.1402404727594389, "epoch": 1.0177851611169473, "percentage": 52.08, "elapsed_time": "22:04:24", "remaining_time": "20:18:51", "throughput": 332.01, "total_tokens": 26383008} {"current_steps": 20835, "total_steps": 40000, "loss": 0.0452, "lr": 0.1401816934632737, "epoch": 1.0180294627806414, "percentage": 52.09, "elapsed_time": "22:04:27", "remaining_time": "20:18:17", "throughput": 332.08, "total_tokens": 26389248} {"current_steps": 20840, "total_steps": 40000, "loss": 0.0549, "lr": 0.1401229156812147, "epoch": 1.0182737644443358, "percentage": 52.1, "elapsed_time": "22:04:30", "remaining_time": "20:17:44", "throughput": 332.15, "total_tokens": 26395904} {"current_steps": 20845, "total_steps": 40000, "loss": 0.0645, "lr": 0.14006413942232626, "epoch": 1.0185180661080302, "percentage": 52.11, "elapsed_time": "22:04:33", "remaining_time": "20:17:10", "throughput": 332.21, "total_tokens": 26402208} {"current_steps": 20850, "total_steps": 40000, "loss": 0.0378, "lr": 0.14000536469567235, "epoch": 1.0187623677717246, "percentage": 52.12, "elapsed_time": "22:04:36", "remaining_time": "20:16:36", "throughput": 332.28, "total_tokens": 26408832} {"current_steps": 20855, "total_steps": 40000, "loss": 0.0669, "lr": 0.13994659151031685, "epoch": 1.019006669435419, "percentage": 52.14, "elapsed_time": "22:04:40", "remaining_time": "20:16:03", "throughput": 332.35, "total_tokens": 26415520} {"current_steps": 20860, "total_steps": 40000, "loss": 0.0675, "lr": 0.13988781987532323, "epoch": 1.0192509710991131, "percentage": 52.15, "elapsed_time": "22:04:43", "remaining_time": "20:15:29", "throughput": 332.42, "total_tokens": 26421632} {"current_steps": 20865, "total_steps": 40000, "loss": 0.0487, "lr": 0.1398290497997549, "epoch": 1.0194952727628075, "percentage": 52.16, "elapsed_time": "22:04:46", "remaining_time": "20:14:55", "throughput": 332.49, "total_tokens": 26428000} {"current_steps": 20870, "total_steps": 40000, "loss": 0.0644, "lr": 0.13977028129267488, "epoch": 1.0197395744265019, "percentage": 52.18, "elapsed_time": "22:04:49", "remaining_time": "20:14:21", "throughput": 332.55, "total_tokens": 26434368} {"current_steps": 20875, "total_steps": 40000, "loss": 0.0506, "lr": 0.13971151436314605, "epoch": 1.0199838760901963, "percentage": 52.19, "elapsed_time": "22:04:52", "remaining_time": "20:13:48", "throughput": 332.62, "total_tokens": 26440704} {"current_steps": 20880, "total_steps": 40000, "loss": 0.0849, "lr": 0.13965274902023103, "epoch": 1.0202281777538904, "percentage": 52.2, "elapsed_time": "22:04:55", "remaining_time": "20:13:14", "throughput": 332.68, "total_tokens": 26446944} {"current_steps": 20885, "total_steps": 40000, "loss": 0.0903, "lr": 0.13959398527299208, "epoch": 1.0204724794175848, "percentage": 52.21, "elapsed_time": "22:04:58", "remaining_time": "20:12:41", "throughput": 332.75, "total_tokens": 26453312} {"current_steps": 20890, "total_steps": 40000, "loss": 0.0462, "lr": 0.13953522313049138, "epoch": 1.0207167810812792, "percentage": 52.23, "elapsed_time": "22:05:01", "remaining_time": "20:12:07", "throughput": 332.82, "total_tokens": 26459584} {"current_steps": 20895, "total_steps": 40000, "loss": 0.0625, "lr": 0.13947646260179083, "epoch": 1.0209610827449735, "percentage": 52.24, "elapsed_time": "22:05:04", "remaining_time": "20:11:33", "throughput": 332.89, "total_tokens": 26466272} {"current_steps": 20900, "total_steps": 40000, "loss": 0.0761, "lr": 0.13941770369595194, "epoch": 1.021205384408668, "percentage": 52.25, "elapsed_time": "22:05:07", "remaining_time": "20:11:00", "throughput": 332.95, "total_tokens": 26472192} {"current_steps": 20905, "total_steps": 40000, "loss": 0.0583, "lr": 0.1393589464220362, "epoch": 1.021449686072362, "percentage": 52.26, "elapsed_time": "22:05:10", "remaining_time": "20:10:26", "throughput": 333.02, "total_tokens": 26478528} {"current_steps": 20910, "total_steps": 40000, "loss": 0.0692, "lr": 0.13930019078910455, "epoch": 1.0216939877360565, "percentage": 52.28, "elapsed_time": "22:05:13", "remaining_time": "20:09:53", "throughput": 333.09, "total_tokens": 26484928} {"current_steps": 20915, "total_steps": 40000, "loss": 0.0417, "lr": 0.139241436806218, "epoch": 1.0219382893997508, "percentage": 52.29, "elapsed_time": "22:05:16", "remaining_time": "20:09:19", "throughput": 333.15, "total_tokens": 26491168} {"current_steps": 20920, "total_steps": 40000, "loss": 0.0862, "lr": 0.13918268448243712, "epoch": 1.0221825910634452, "percentage": 52.3, "elapsed_time": "22:05:20", "remaining_time": "20:08:45", "throughput": 333.21, "total_tokens": 26497120} {"current_steps": 20925, "total_steps": 40000, "loss": 0.0588, "lr": 0.13912393382682217, "epoch": 1.0224268927271394, "percentage": 52.31, "elapsed_time": "22:05:23", "remaining_time": "20:08:12", "throughput": 333.29, "total_tokens": 26503968} {"current_steps": 20930, "total_steps": 40000, "loss": 0.0636, "lr": 0.1390651848484333, "epoch": 1.0226711943908338, "percentage": 52.33, "elapsed_time": "22:05:26", "remaining_time": "20:07:39", "throughput": 333.36, "total_tokens": 26510784} {"current_steps": 20935, "total_steps": 40000, "loss": 0.0498, "lr": 0.1390064375563304, "epoch": 1.0229154960545281, "percentage": 52.34, "elapsed_time": "22:05:29", "remaining_time": "20:07:05", "throughput": 333.42, "total_tokens": 26516736} {"current_steps": 20940, "total_steps": 40000, "loss": 0.0538, "lr": 0.13894769195957293, "epoch": 1.0231597977182225, "percentage": 52.35, "elapsed_time": "22:05:32", "remaining_time": "20:06:32", "throughput": 333.49, "total_tokens": 26522944} {"current_steps": 20945, "total_steps": 40000, "loss": 0.0661, "lr": 0.13888894806722032, "epoch": 1.023404099381917, "percentage": 52.36, "elapsed_time": "22:05:35", "remaining_time": "20:05:58", "throughput": 333.56, "total_tokens": 26529632} {"current_steps": 20950, "total_steps": 40000, "loss": 0.0676, "lr": 0.1388302058883315, "epoch": 1.023648401045611, "percentage": 52.38, "elapsed_time": "22:05:38", "remaining_time": "20:05:25", "throughput": 333.62, "total_tokens": 26535744} {"current_steps": 20955, "total_steps": 40000, "loss": 0.0476, "lr": 0.13877146543196528, "epoch": 1.0238927027093054, "percentage": 52.39, "elapsed_time": "22:05:41", "remaining_time": "20:04:51", "throughput": 333.69, "total_tokens": 26542080} {"current_steps": 20960, "total_steps": 40000, "loss": 0.0449, "lr": 0.13871272670718027, "epoch": 1.0241370043729998, "percentage": 52.4, "elapsed_time": "22:05:44", "remaining_time": "20:04:18", "throughput": 333.75, "total_tokens": 26548416} {"current_steps": 20965, "total_steps": 40000, "loss": 0.04, "lr": 0.13865398972303455, "epoch": 1.0243813060366942, "percentage": 52.41, "elapsed_time": "22:05:47", "remaining_time": "20:03:44", "throughput": 333.82, "total_tokens": 26554752} {"current_steps": 20970, "total_steps": 40000, "loss": 0.0484, "lr": 0.13859525448858623, "epoch": 1.0246256077003884, "percentage": 52.42, "elapsed_time": "22:05:51", "remaining_time": "20:03:11", "throughput": 333.89, "total_tokens": 26561216} {"current_steps": 20975, "total_steps": 40000, "loss": 0.04, "lr": 0.13853652101289304, "epoch": 1.0248699093640827, "percentage": 52.44, "elapsed_time": "22:05:54", "remaining_time": "20:02:38", "throughput": 333.95, "total_tokens": 26567456} {"current_steps": 20980, "total_steps": 40000, "loss": 0.0617, "lr": 0.13847778930501234, "epoch": 1.0251142110277771, "percentage": 52.45, "elapsed_time": "22:05:57", "remaining_time": "20:02:04", "throughput": 334.02, "total_tokens": 26573664} {"current_steps": 20985, "total_steps": 40000, "loss": 0.1293, "lr": 0.1384190593740013, "epoch": 1.0253585126914715, "percentage": 52.46, "elapsed_time": "22:06:00", "remaining_time": "20:01:31", "throughput": 334.08, "total_tokens": 26579648} {"current_steps": 20990, "total_steps": 40000, "loss": 0.0677, "lr": 0.13836033122891686, "epoch": 1.0256028143551656, "percentage": 52.48, "elapsed_time": "22:06:03", "remaining_time": "20:00:57", "throughput": 334.15, "total_tokens": 26585792} {"current_steps": 20995, "total_steps": 40000, "loss": 0.058, "lr": 0.1383016048788156, "epoch": 1.02584711601886, "percentage": 52.49, "elapsed_time": "22:06:06", "remaining_time": "20:00:24", "throughput": 334.21, "total_tokens": 26592224} {"current_steps": 21000, "total_steps": 40000, "loss": 0.0531, "lr": 0.13824288033275392, "epoch": 1.0260914176825544, "percentage": 52.5, "elapsed_time": "22:06:09", "remaining_time": "19:59:51", "throughput": 334.28, "total_tokens": 26598784} {"current_steps": 21000, "total_steps": 40000, "eval_loss": 0.06586360931396484, "epoch": 1.0260914176825544, "percentage": 52.5, "elapsed_time": "22:16:49", "remaining_time": "20:09:30", "throughput": 331.61, "total_tokens": 26598784} {"current_steps": 21005, "total_steps": 40000, "loss": 0.0734, "lr": 0.1381841575997878, "epoch": 1.0263357193462488, "percentage": 52.51, "elapsed_time": "22:16:53", "remaining_time": "20:08:57", "throughput": 331.68, "total_tokens": 26604992} {"current_steps": 21010, "total_steps": 40000, "loss": 0.0594, "lr": 0.13812543668897306, "epoch": 1.0265800210099432, "percentage": 52.52, "elapsed_time": "22:16:56", "remaining_time": "20:08:24", "throughput": 331.74, "total_tokens": 26610816} {"current_steps": 21015, "total_steps": 40000, "loss": 0.0763, "lr": 0.13806671760936526, "epoch": 1.0268243226736373, "percentage": 52.54, "elapsed_time": "22:16:59", "remaining_time": "20:07:50", "throughput": 331.81, "total_tokens": 26617440} {"current_steps": 21020, "total_steps": 40000, "loss": 0.0721, "lr": 0.13800800037001956, "epoch": 1.0270686243373317, "percentage": 52.55, "elapsed_time": "22:17:02", "remaining_time": "20:07:17", "throughput": 331.87, "total_tokens": 26623808} {"current_steps": 21025, "total_steps": 40000, "loss": 0.0251, "lr": 0.13794928497999087, "epoch": 1.027312926001026, "percentage": 52.56, "elapsed_time": "22:17:06", "remaining_time": "20:06:43", "throughput": 331.94, "total_tokens": 26630016} {"current_steps": 21030, "total_steps": 40000, "loss": 0.0507, "lr": 0.1378905714483339, "epoch": 1.0275572276647205, "percentage": 52.58, "elapsed_time": "22:17:09", "remaining_time": "20:06:10", "throughput": 332.0, "total_tokens": 26636032} {"current_steps": 21035, "total_steps": 40000, "loss": 0.0343, "lr": 0.13783185978410295, "epoch": 1.0278015293284146, "percentage": 52.59, "elapsed_time": "22:17:12", "remaining_time": "20:05:36", "throughput": 332.07, "total_tokens": 26642592} {"current_steps": 21040, "total_steps": 40000, "loss": 0.0537, "lr": 0.13777314999635218, "epoch": 1.028045830992109, "percentage": 52.6, "elapsed_time": "22:17:15", "remaining_time": "20:05:03", "throughput": 332.13, "total_tokens": 26648704} {"current_steps": 21045, "total_steps": 40000, "loss": 0.0677, "lr": 0.1377144420941353, "epoch": 1.0282901326558034, "percentage": 52.61, "elapsed_time": "22:17:18", "remaining_time": "20:04:29", "throughput": 332.2, "total_tokens": 26654848} {"current_steps": 21050, "total_steps": 40000, "loss": 0.081, "lr": 0.13765573608650586, "epoch": 1.0285344343194978, "percentage": 52.62, "elapsed_time": "22:17:21", "remaining_time": "20:03:56", "throughput": 332.27, "total_tokens": 26661504} {"current_steps": 21055, "total_steps": 40000, "loss": 0.0655, "lr": 0.13759703198251702, "epoch": 1.0287787359831921, "percentage": 52.64, "elapsed_time": "22:17:24", "remaining_time": "20:03:22", "throughput": 332.33, "total_tokens": 26667808} {"current_steps": 21060, "total_steps": 40000, "loss": 0.0761, "lr": 0.13753832979122174, "epoch": 1.0290230376468863, "percentage": 52.65, "elapsed_time": "22:17:27", "remaining_time": "20:02:49", "throughput": 332.4, "total_tokens": 26674496} {"current_steps": 21065, "total_steps": 40000, "loss": 0.0453, "lr": 0.13747962952167264, "epoch": 1.0292673393105807, "percentage": 52.66, "elapsed_time": "22:17:30", "remaining_time": "20:02:16", "throughput": 332.47, "total_tokens": 26680768} {"current_steps": 21070, "total_steps": 40000, "loss": 0.0832, "lr": 0.13742093118292192, "epoch": 1.029511640974275, "percentage": 52.68, "elapsed_time": "22:17:34", "remaining_time": "20:01:43", "throughput": 332.54, "total_tokens": 26687424} {"current_steps": 21075, "total_steps": 40000, "loss": 0.0652, "lr": 0.13736223478402174, "epoch": 1.0297559426379694, "percentage": 52.69, "elapsed_time": "22:17:37", "remaining_time": "20:01:09", "throughput": 332.6, "total_tokens": 26693728} {"current_steps": 21080, "total_steps": 40000, "loss": 0.0569, "lr": 0.1373035403340238, "epoch": 1.0300002443016636, "percentage": 52.7, "elapsed_time": "22:17:40", "remaining_time": "20:00:36", "throughput": 332.66, "total_tokens": 26699744} {"current_steps": 21085, "total_steps": 40000, "loss": 0.0527, "lr": 0.13724484784197943, "epoch": 1.030244545965358, "percentage": 52.71, "elapsed_time": "22:17:43", "remaining_time": "20:00:02", "throughput": 332.73, "total_tokens": 26706048} {"current_steps": 21090, "total_steps": 40000, "loss": 0.0898, "lr": 0.13718615731693987, "epoch": 1.0304888476290524, "percentage": 52.73, "elapsed_time": "22:17:46", "remaining_time": "19:59:29", "throughput": 332.79, "total_tokens": 26712192} {"current_steps": 21095, "total_steps": 40000, "loss": 0.0614, "lr": 0.13712746876795587, "epoch": 1.0307331492927467, "percentage": 52.74, "elapsed_time": "22:17:49", "remaining_time": "19:58:56", "throughput": 332.86, "total_tokens": 26718304} {"current_steps": 21100, "total_steps": 40000, "loss": 0.0725, "lr": 0.13706878220407792, "epoch": 1.030977450956441, "percentage": 52.75, "elapsed_time": "22:17:52", "remaining_time": "19:58:22", "throughput": 332.92, "total_tokens": 26724608} {"current_steps": 21105, "total_steps": 40000, "loss": 0.0533, "lr": 0.13701009763435631, "epoch": 1.0312217526201353, "percentage": 52.76, "elapsed_time": "22:17:55", "remaining_time": "19:57:49", "throughput": 332.99, "total_tokens": 26731360} {"current_steps": 21110, "total_steps": 40000, "loss": 0.087, "lr": 0.13695141506784084, "epoch": 1.0314660542838296, "percentage": 52.78, "elapsed_time": "22:17:58", "remaining_time": "19:57:16", "throughput": 333.06, "total_tokens": 26737856} {"current_steps": 21115, "total_steps": 40000, "loss": 0.0959, "lr": 0.13689273451358114, "epoch": 1.031710355947524, "percentage": 52.79, "elapsed_time": "22:18:01", "remaining_time": "19:56:43", "throughput": 333.13, "total_tokens": 26744512} {"current_steps": 21120, "total_steps": 40000, "loss": 0.0659, "lr": 0.13683405598062653, "epoch": 1.0319546576112184, "percentage": 52.8, "elapsed_time": "22:18:05", "remaining_time": "19:56:09", "throughput": 333.2, "total_tokens": 26751008} {"current_steps": 21125, "total_steps": 40000, "loss": 0.0606, "lr": 0.1367753794780259, "epoch": 1.0321989592749126, "percentage": 52.81, "elapsed_time": "22:18:07", "remaining_time": "19:55:36", "throughput": 333.26, "total_tokens": 26756864} {"current_steps": 21130, "total_steps": 40000, "loss": 0.059, "lr": 0.13671670501482802, "epoch": 1.032443260938607, "percentage": 52.83, "elapsed_time": "22:18:11", "remaining_time": "19:55:03", "throughput": 333.32, "total_tokens": 26762976} {"current_steps": 21135, "total_steps": 40000, "loss": 0.0608, "lr": 0.1366580326000811, "epoch": 1.0326875626023013, "percentage": 52.84, "elapsed_time": "22:18:14", "remaining_time": "19:54:30", "throughput": 333.39, "total_tokens": 26769248} {"current_steps": 21140, "total_steps": 40000, "loss": 0.0605, "lr": 0.1365993622428332, "epoch": 1.0329318642659957, "percentage": 52.85, "elapsed_time": "22:18:17", "remaining_time": "19:53:56", "throughput": 333.46, "total_tokens": 26775648} {"current_steps": 21145, "total_steps": 40000, "loss": 0.0773, "lr": 0.13654069395213211, "epoch": 1.03317616592969, "percentage": 52.86, "elapsed_time": "22:18:20", "remaining_time": "19:53:23", "throughput": 333.52, "total_tokens": 26781696} {"current_steps": 21150, "total_steps": 40000, "loss": 0.0567, "lr": 0.13648202773702509, "epoch": 1.0334204675933842, "percentage": 52.88, "elapsed_time": "22:18:23", "remaining_time": "19:52:50", "throughput": 333.59, "total_tokens": 26788288} {"current_steps": 21155, "total_steps": 40000, "loss": 0.0498, "lr": 0.13642336360655927, "epoch": 1.0336647692570786, "percentage": 52.89, "elapsed_time": "22:18:26", "remaining_time": "19:52:17", "throughput": 333.65, "total_tokens": 26794240} {"current_steps": 21160, "total_steps": 40000, "loss": 0.0689, "lr": 0.13636470156978145, "epoch": 1.033909070920773, "percentage": 52.9, "elapsed_time": "22:18:29", "remaining_time": "19:51:44", "throughput": 333.72, "total_tokens": 26800416} {"current_steps": 21165, "total_steps": 40000, "loss": 0.065, "lr": 0.13630604163573798, "epoch": 1.0341533725844674, "percentage": 52.91, "elapsed_time": "22:18:32", "remaining_time": "19:51:10", "throughput": 333.78, "total_tokens": 26806784} {"current_steps": 21170, "total_steps": 40000, "loss": 0.0623, "lr": 0.13624738381347495, "epoch": 1.0343976742481615, "percentage": 52.92, "elapsed_time": "22:18:35", "remaining_time": "19:50:37", "throughput": 333.85, "total_tokens": 26812896} {"current_steps": 21175, "total_steps": 40000, "loss": 0.0478, "lr": 0.1361887281120382, "epoch": 1.034641975911856, "percentage": 52.94, "elapsed_time": "22:18:38", "remaining_time": "19:50:04", "throughput": 333.91, "total_tokens": 26819232} {"current_steps": 21180, "total_steps": 40000, "loss": 0.0545, "lr": 0.13613007454047307, "epoch": 1.0348862775755503, "percentage": 52.95, "elapsed_time": "22:18:41", "remaining_time": "19:49:31", "throughput": 333.98, "total_tokens": 26825504} {"current_steps": 21185, "total_steps": 40000, "loss": 0.0549, "lr": 0.13607142310782486, "epoch": 1.0351305792392447, "percentage": 52.96, "elapsed_time": "22:18:44", "remaining_time": "19:48:58", "throughput": 334.05, "total_tokens": 26832480} {"current_steps": 21190, "total_steps": 40000, "loss": 0.0272, "lr": 0.13601277382313814, "epoch": 1.035374880902939, "percentage": 52.98, "elapsed_time": "22:18:47", "remaining_time": "19:48:25", "throughput": 334.12, "total_tokens": 26838944} {"current_steps": 21195, "total_steps": 40000, "loss": 0.0549, "lr": 0.1359541266954575, "epoch": 1.0356191825666332, "percentage": 52.99, "elapsed_time": "22:18:50", "remaining_time": "19:47:52", "throughput": 334.18, "total_tokens": 26845280} {"current_steps": 21200, "total_steps": 40000, "loss": 0.032, "lr": 0.13589548173382707, "epoch": 1.0358634842303276, "percentage": 53.0, "elapsed_time": "22:18:53", "remaining_time": "19:47:19", "throughput": 334.25, "total_tokens": 26851648} {"current_steps": 21200, "total_steps": 40000, "eval_loss": 0.06693243980407715, "epoch": 1.0358634842303276, "percentage": 53.0, "elapsed_time": "22:29:34", "remaining_time": "19:56:47", "throughput": 331.61, "total_tokens": 26851648} {"current_steps": 21205, "total_steps": 40000, "loss": 0.0597, "lr": 0.1358368389472906, "epoch": 1.036107785894022, "percentage": 53.01, "elapsed_time": "22:29:38", "remaining_time": "19:56:14", "throughput": 331.66, "total_tokens": 26857344} {"current_steps": 21210, "total_steps": 40000, "loss": 0.0634, "lr": 0.13577819834489155, "epoch": 1.0363520875577164, "percentage": 53.02, "elapsed_time": "22:29:41", "remaining_time": "19:55:41", "throughput": 331.73, "total_tokens": 26863680} {"current_steps": 21215, "total_steps": 40000, "loss": 0.0589, "lr": 0.135719559935673, "epoch": 1.0365963892214105, "percentage": 53.04, "elapsed_time": "22:29:44", "remaining_time": "19:55:08", "throughput": 331.79, "total_tokens": 26869856} {"current_steps": 21220, "total_steps": 40000, "loss": 0.0542, "lr": 0.13566092372867775, "epoch": 1.0368406908851049, "percentage": 53.05, "elapsed_time": "22:29:47", "remaining_time": "19:54:35", "throughput": 331.86, "total_tokens": 26876384} {"current_steps": 21225, "total_steps": 40000, "loss": 0.0726, "lr": 0.13560228973294833, "epoch": 1.0370849925487993, "percentage": 53.06, "elapsed_time": "22:29:50", "remaining_time": "19:54:01", "throughput": 331.92, "total_tokens": 26882272} {"current_steps": 21230, "total_steps": 40000, "loss": 0.0486, "lr": 0.13554365795752668, "epoch": 1.0373292942124936, "percentage": 53.08, "elapsed_time": "22:29:53", "remaining_time": "19:53:28", "throughput": 331.99, "total_tokens": 26889056} {"current_steps": 21235, "total_steps": 40000, "loss": 0.0384, "lr": 0.1354850284114547, "epoch": 1.037573595876188, "percentage": 53.09, "elapsed_time": "22:29:56", "remaining_time": "19:52:55", "throughput": 332.06, "total_tokens": 26895392} {"current_steps": 21240, "total_steps": 40000, "loss": 0.062, "lr": 0.13542640110377374, "epoch": 1.0378178975398822, "percentage": 53.1, "elapsed_time": "22:29:59", "remaining_time": "19:52:22", "throughput": 332.12, "total_tokens": 26901824} {"current_steps": 21245, "total_steps": 40000, "loss": 0.0811, "lr": 0.13536777604352487, "epoch": 1.0380621992035766, "percentage": 53.11, "elapsed_time": "22:30:02", "remaining_time": "19:51:48", "throughput": 332.19, "total_tokens": 26908032} {"current_steps": 21250, "total_steps": 40000, "loss": 0.0875, "lr": 0.13530915323974887, "epoch": 1.038306500867271, "percentage": 53.12, "elapsed_time": "22:30:05", "remaining_time": "19:51:15", "throughput": 332.25, "total_tokens": 26914368} {"current_steps": 21255, "total_steps": 40000, "loss": 0.0579, "lr": 0.13525053270148596, "epoch": 1.0385508025309653, "percentage": 53.14, "elapsed_time": "22:30:08", "remaining_time": "19:50:42", "throughput": 332.32, "total_tokens": 26920512} {"current_steps": 21260, "total_steps": 40000, "loss": 0.0532, "lr": 0.13519191443777628, "epoch": 1.0387951041946595, "percentage": 53.15, "elapsed_time": "22:30:12", "remaining_time": "19:50:09", "throughput": 332.38, "total_tokens": 26926688} {"current_steps": 21265, "total_steps": 40000, "loss": 0.0465, "lr": 0.13513329845765953, "epoch": 1.0390394058583539, "percentage": 53.16, "elapsed_time": "22:30:15", "remaining_time": "19:49:36", "throughput": 332.45, "total_tokens": 26933280} {"current_steps": 21270, "total_steps": 40000, "loss": 0.0611, "lr": 0.13507468477017495, "epoch": 1.0392837075220482, "percentage": 53.17, "elapsed_time": "22:30:18", "remaining_time": "19:49:03", "throughput": 332.51, "total_tokens": 26939520} {"current_steps": 21275, "total_steps": 40000, "loss": 0.0468, "lr": 0.13501607338436153, "epoch": 1.0395280091857426, "percentage": 53.19, "elapsed_time": "22:30:21", "remaining_time": "19:48:30", "throughput": 332.58, "total_tokens": 26945888} {"current_steps": 21280, "total_steps": 40000, "loss": 0.0377, "lr": 0.13495746430925798, "epoch": 1.039772310849437, "percentage": 53.2, "elapsed_time": "22:30:24", "remaining_time": "19:47:57", "throughput": 332.64, "total_tokens": 26952032} {"current_steps": 21285, "total_steps": 40000, "loss": 0.0534, "lr": 0.13489885755390238, "epoch": 1.0400166125131312, "percentage": 53.21, "elapsed_time": "22:30:27", "remaining_time": "19:47:23", "throughput": 332.71, "total_tokens": 26958656} {"current_steps": 21290, "total_steps": 40000, "loss": 0.0474, "lr": 0.13484025312733275, "epoch": 1.0402609141768255, "percentage": 53.23, "elapsed_time": "22:30:30", "remaining_time": "19:46:50", "throughput": 332.78, "total_tokens": 26964992} {"current_steps": 21295, "total_steps": 40000, "loss": 0.0411, "lr": 0.13478165103858658, "epoch": 1.04050521584052, "percentage": 53.24, "elapsed_time": "22:30:33", "remaining_time": "19:46:18", "throughput": 332.85, "total_tokens": 26971744} {"current_steps": 21300, "total_steps": 40000, "loss": 0.0757, "lr": 0.13472305129670106, "epoch": 1.0407495175042143, "percentage": 53.25, "elapsed_time": "22:30:36", "remaining_time": "19:45:45", "throughput": 332.91, "total_tokens": 26978112} {"current_steps": 21305, "total_steps": 40000, "loss": 0.0485, "lr": 0.13466445391071305, "epoch": 1.0409938191679085, "percentage": 53.26, "elapsed_time": "22:30:39", "remaining_time": "19:45:11", "throughput": 332.97, "total_tokens": 26984096} {"current_steps": 21310, "total_steps": 40000, "loss": 0.0667, "lr": 0.13460585888965895, "epoch": 1.0412381208316028, "percentage": 53.27, "elapsed_time": "22:30:42", "remaining_time": "19:44:38", "throughput": 333.03, "total_tokens": 26990016} {"current_steps": 21315, "total_steps": 40000, "loss": 0.0601, "lr": 0.13454726624257482, "epoch": 1.0414824224952972, "percentage": 53.29, "elapsed_time": "22:30:45", "remaining_time": "19:44:05", "throughput": 333.1, "total_tokens": 26996608} {"current_steps": 21320, "total_steps": 40000, "loss": 0.0497, "lr": 0.1344886759784965, "epoch": 1.0417267241589916, "percentage": 53.3, "elapsed_time": "22:30:49", "remaining_time": "19:43:33", "throughput": 333.17, "total_tokens": 27003168} {"current_steps": 21325, "total_steps": 40000, "loss": 0.101, "lr": 0.13443008810645923, "epoch": 1.0419710258226857, "percentage": 53.31, "elapsed_time": "22:30:52", "remaining_time": "19:42:59", "throughput": 333.23, "total_tokens": 27008992} {"current_steps": 21330, "total_steps": 40000, "loss": 0.0651, "lr": 0.13437150263549807, "epoch": 1.0422153274863801, "percentage": 53.33, "elapsed_time": "22:30:55", "remaining_time": "19:42:27", "throughput": 333.3, "total_tokens": 27015520} {"current_steps": 21335, "total_steps": 40000, "loss": 0.0446, "lr": 0.13431291957464755, "epoch": 1.0424596291500745, "percentage": 53.34, "elapsed_time": "22:30:58", "remaining_time": "19:41:54", "throughput": 333.36, "total_tokens": 27021760} {"current_steps": 21340, "total_steps": 40000, "loss": 0.0362, "lr": 0.13425433893294197, "epoch": 1.0427039308137689, "percentage": 53.35, "elapsed_time": "22:31:01", "remaining_time": "19:41:21", "throughput": 333.43, "total_tokens": 27028512} {"current_steps": 21345, "total_steps": 40000, "loss": 0.0614, "lr": 0.13419576071941525, "epoch": 1.0429482324774633, "percentage": 53.36, "elapsed_time": "22:31:04", "remaining_time": "19:40:48", "throughput": 333.49, "total_tokens": 27034528} {"current_steps": 21350, "total_steps": 40000, "loss": 0.0679, "lr": 0.1341371849431008, "epoch": 1.0431925341411574, "percentage": 53.37, "elapsed_time": "22:31:07", "remaining_time": "19:40:15", "throughput": 333.56, "total_tokens": 27040992} {"current_steps": 21355, "total_steps": 40000, "loss": 0.0462, "lr": 0.13407861161303178, "epoch": 1.0434368358048518, "percentage": 53.39, "elapsed_time": "22:31:10", "remaining_time": "19:39:42", "throughput": 333.63, "total_tokens": 27047360} {"current_steps": 21360, "total_steps": 40000, "loss": 0.0591, "lr": 0.13402004073824098, "epoch": 1.0436811374685462, "percentage": 53.4, "elapsed_time": "22:31:13", "remaining_time": "19:39:09", "throughput": 333.69, "total_tokens": 27053600} {"current_steps": 21365, "total_steps": 40000, "loss": 0.0823, "lr": 0.13396147232776062, "epoch": 1.0439254391322406, "percentage": 53.41, "elapsed_time": "22:31:16", "remaining_time": "19:38:36", "throughput": 333.75, "total_tokens": 27059744} {"current_steps": 21370, "total_steps": 40000, "loss": 0.0499, "lr": 0.13390290639062288, "epoch": 1.0441697407959347, "percentage": 53.42, "elapsed_time": "22:31:19", "remaining_time": "19:38:04", "throughput": 333.82, "total_tokens": 27066400} {"current_steps": 21375, "total_steps": 40000, "loss": 0.0604, "lr": 0.13384434293585917, "epoch": 1.044414042459629, "percentage": 53.44, "elapsed_time": "22:31:22", "remaining_time": "19:37:31", "throughput": 333.88, "total_tokens": 27072192} {"current_steps": 21380, "total_steps": 40000, "loss": 0.0783, "lr": 0.13378578197250088, "epoch": 1.0446583441233235, "percentage": 53.45, "elapsed_time": "22:31:26", "remaining_time": "19:36:58", "throughput": 333.95, "total_tokens": 27078592} {"current_steps": 21385, "total_steps": 40000, "loss": 0.0936, "lr": 0.13372722350957872, "epoch": 1.0449026457870179, "percentage": 53.46, "elapsed_time": "22:31:29", "remaining_time": "19:36:25", "throughput": 334.02, "total_tokens": 27085024} {"current_steps": 21390, "total_steps": 40000, "loss": 0.0679, "lr": 0.13366866755612322, "epoch": 1.0451469474507122, "percentage": 53.47, "elapsed_time": "22:31:32", "remaining_time": "19:35:52", "throughput": 334.08, "total_tokens": 27091008} {"current_steps": 21395, "total_steps": 40000, "loss": 0.0393, "lr": 0.13361011412116436, "epoch": 1.0453912491144064, "percentage": 53.49, "elapsed_time": "22:31:35", "remaining_time": "19:35:20", "throughput": 334.14, "total_tokens": 27097184} {"current_steps": 21400, "total_steps": 40000, "loss": 0.0714, "lr": 0.13355156321373196, "epoch": 1.0456355507781008, "percentage": 53.5, "elapsed_time": "22:31:38", "remaining_time": "19:34:47", "throughput": 334.2, "total_tokens": 27103392} {"current_steps": 21400, "total_steps": 40000, "eval_loss": 0.06473684310913086, "epoch": 1.0456355507781008, "percentage": 53.5, "elapsed_time": "22:42:18", "remaining_time": "19:44:03", "throughput": 331.59, "total_tokens": 27103392} {"current_steps": 21405, "total_steps": 40000, "loss": 0.0444, "lr": 0.13349301484285514, "epoch": 1.0458798524417952, "percentage": 53.51, "elapsed_time": "22:42:22", "remaining_time": "19:43:31", "throughput": 331.65, "total_tokens": 27109888} {"current_steps": 21410, "total_steps": 40000, "loss": 0.055, "lr": 0.13343446901756295, "epoch": 1.0461241541054895, "percentage": 53.52, "elapsed_time": "22:42:25", "remaining_time": "19:42:58", "throughput": 331.72, "total_tokens": 27116480} {"current_steps": 21415, "total_steps": 40000, "loss": 0.0618, "lr": 0.13337592574688376, "epoch": 1.0463684557691837, "percentage": 53.54, "elapsed_time": "22:42:28", "remaining_time": "19:42:25", "throughput": 331.78, "total_tokens": 27122816} {"current_steps": 21420, "total_steps": 40000, "loss": 0.0625, "lr": 0.13331738503984572, "epoch": 1.046612757432878, "percentage": 53.55, "elapsed_time": "22:42:31", "remaining_time": "19:41:52", "throughput": 331.85, "total_tokens": 27129056} {"current_steps": 21425, "total_steps": 40000, "loss": 0.0315, "lr": 0.1332588469054766, "epoch": 1.0468570590965725, "percentage": 53.56, "elapsed_time": "22:42:35", "remaining_time": "19:41:19", "throughput": 331.91, "total_tokens": 27135456} {"current_steps": 21430, "total_steps": 40000, "loss": 0.0572, "lr": 0.1332003113528036, "epoch": 1.0471013607602668, "percentage": 53.57, "elapsed_time": "22:42:38", "remaining_time": "19:40:46", "throughput": 331.97, "total_tokens": 27141536} {"current_steps": 21435, "total_steps": 40000, "loss": 0.0553, "lr": 0.13314177839085373, "epoch": 1.0473456624239612, "percentage": 53.59, "elapsed_time": "22:42:41", "remaining_time": "19:40:13", "throughput": 332.04, "total_tokens": 27147616} {"current_steps": 21440, "total_steps": 40000, "loss": 0.0726, "lr": 0.13308324802865354, "epoch": 1.0475899640876554, "percentage": 53.6, "elapsed_time": "22:42:44", "remaining_time": "19:39:40", "throughput": 332.1, "total_tokens": 27154176} {"current_steps": 21445, "total_steps": 40000, "loss": 0.04, "lr": 0.13302472027522905, "epoch": 1.0478342657513497, "percentage": 53.61, "elapsed_time": "22:42:47", "remaining_time": "19:39:08", "throughput": 332.17, "total_tokens": 27160800} {"current_steps": 21450, "total_steps": 40000, "loss": 0.0552, "lr": 0.13296619513960606, "epoch": 1.0480785674150441, "percentage": 53.62, "elapsed_time": "22:42:50", "remaining_time": "19:38:35", "throughput": 332.24, "total_tokens": 27167200} {"current_steps": 21455, "total_steps": 40000, "loss": 0.0657, "lr": 0.1329076726308098, "epoch": 1.0483228690787385, "percentage": 53.64, "elapsed_time": "22:42:53", "remaining_time": "19:38:02", "throughput": 332.3, "total_tokens": 27173472} {"current_steps": 21460, "total_steps": 40000, "loss": 0.0789, "lr": 0.13284915275786519, "epoch": 1.0485671707424327, "percentage": 53.65, "elapsed_time": "22:42:56", "remaining_time": "19:37:29", "throughput": 332.37, "total_tokens": 27180032} {"current_steps": 21465, "total_steps": 40000, "loss": 0.0509, "lr": 0.1327906355297968, "epoch": 1.048811472406127, "percentage": 53.66, "elapsed_time": "22:42:59", "remaining_time": "19:36:56", "throughput": 332.44, "total_tokens": 27186528} {"current_steps": 21470, "total_steps": 40000, "loss": 0.0711, "lr": 0.13273212095562867, "epoch": 1.0490557740698214, "percentage": 53.67, "elapsed_time": "22:43:02", "remaining_time": "19:36:23", "throughput": 332.5, "total_tokens": 27192864} {"current_steps": 21475, "total_steps": 40000, "loss": 0.0348, "lr": 0.13267360904438444, "epoch": 1.0493000757335158, "percentage": 53.69, "elapsed_time": "22:43:06", "remaining_time": "19:35:51", "throughput": 332.57, "total_tokens": 27199328} {"current_steps": 21480, "total_steps": 40000, "loss": 0.0432, "lr": 0.1326150998050875, "epoch": 1.0495443773972102, "percentage": 53.7, "elapsed_time": "22:43:09", "remaining_time": "19:35:18", "throughput": 332.63, "total_tokens": 27205600} {"current_steps": 21485, "total_steps": 40000, "loss": 0.0567, "lr": 0.1325565932467606, "epoch": 1.0497886790609043, "percentage": 53.71, "elapsed_time": "22:43:12", "remaining_time": "19:34:45", "throughput": 332.7, "total_tokens": 27212384} {"current_steps": 21490, "total_steps": 40000, "loss": 0.0935, "lr": 0.13249808937842628, "epoch": 1.0500329807245987, "percentage": 53.73, "elapsed_time": "22:43:15", "remaining_time": "19:34:12", "throughput": 332.77, "total_tokens": 27218720} {"current_steps": 21495, "total_steps": 40000, "loss": 0.0593, "lr": 0.1324395882091065, "epoch": 1.050277282388293, "percentage": 53.74, "elapsed_time": "22:43:18", "remaining_time": "19:33:40", "throughput": 332.83, "total_tokens": 27225056} {"current_steps": 21500, "total_steps": 40000, "loss": 0.0419, "lr": 0.13238108974782284, "epoch": 1.0505215840519875, "percentage": 53.75, "elapsed_time": "22:43:21", "remaining_time": "19:33:07", "throughput": 332.89, "total_tokens": 27231264} {"current_steps": 21505, "total_steps": 40000, "loss": 0.0429, "lr": 0.13232259400359664, "epoch": 1.0507658857156816, "percentage": 53.76, "elapsed_time": "22:43:24", "remaining_time": "19:32:34", "throughput": 332.96, "total_tokens": 27237984} {"current_steps": 21510, "total_steps": 40000, "loss": 0.0872, "lr": 0.13226410098544852, "epoch": 1.051010187379376, "percentage": 53.77, "elapsed_time": "22:43:27", "remaining_time": "19:32:02", "throughput": 333.04, "total_tokens": 27245280} {"current_steps": 21515, "total_steps": 40000, "loss": 0.066, "lr": 0.13220561070239892, "epoch": 1.0512544890430704, "percentage": 53.79, "elapsed_time": "22:43:31", "remaining_time": "19:31:29", "throughput": 333.11, "total_tokens": 27252064} {"current_steps": 21520, "total_steps": 40000, "loss": 0.0508, "lr": 0.13214712316346783, "epoch": 1.0514987907067648, "percentage": 53.8, "elapsed_time": "22:43:34", "remaining_time": "19:30:56", "throughput": 333.18, "total_tokens": 27258656} {"current_steps": 21525, "total_steps": 40000, "loss": 0.0863, "lr": 0.13208863837767465, "epoch": 1.051743092370459, "percentage": 53.81, "elapsed_time": "22:43:37", "remaining_time": "19:30:24", "throughput": 333.24, "total_tokens": 27264768} {"current_steps": 21530, "total_steps": 40000, "loss": 0.0352, "lr": 0.13203015635403856, "epoch": 1.0519873940341533, "percentage": 53.83, "elapsed_time": "22:43:40", "remaining_time": "19:29:51", "throughput": 333.3, "total_tokens": 27270816} {"current_steps": 21535, "total_steps": 40000, "loss": 0.06, "lr": 0.13197167710157817, "epoch": 1.0522316956978477, "percentage": 53.84, "elapsed_time": "22:43:43", "remaining_time": "19:29:18", "throughput": 333.37, "total_tokens": 27277376} {"current_steps": 21540, "total_steps": 40000, "loss": 0.0607, "lr": 0.13191320062931167, "epoch": 1.052475997361542, "percentage": 53.85, "elapsed_time": "22:43:46", "remaining_time": "19:28:46", "throughput": 333.44, "total_tokens": 27284448} {"current_steps": 21545, "total_steps": 40000, "loss": 0.0575, "lr": 0.13185472694625702, "epoch": 1.0527202990252365, "percentage": 53.86, "elapsed_time": "22:43:49", "remaining_time": "19:28:13", "throughput": 333.51, "total_tokens": 27290624} {"current_steps": 21550, "total_steps": 40000, "loss": 0.0434, "lr": 0.13179625606143142, "epoch": 1.0529646006889306, "percentage": 53.87, "elapsed_time": "22:43:52", "remaining_time": "19:27:41", "throughput": 333.57, "total_tokens": 27297088} {"current_steps": 21555, "total_steps": 40000, "loss": 0.0877, "lr": 0.13173778798385188, "epoch": 1.053208902352625, "percentage": 53.89, "elapsed_time": "22:43:55", "remaining_time": "19:27:08", "throughput": 333.64, "total_tokens": 27303360} {"current_steps": 21560, "total_steps": 40000, "loss": 0.0545, "lr": 0.13167932272253505, "epoch": 1.0534532040163194, "percentage": 53.9, "elapsed_time": "22:43:59", "remaining_time": "19:26:35", "throughput": 333.7, "total_tokens": 27309792} {"current_steps": 21565, "total_steps": 40000, "loss": 0.0584, "lr": 0.1316208602864968, "epoch": 1.0536975056800137, "percentage": 53.91, "elapsed_time": "22:44:02", "remaining_time": "19:26:03", "throughput": 333.77, "total_tokens": 27316320} {"current_steps": 21570, "total_steps": 40000, "loss": 0.0476, "lr": 0.13156240068475292, "epoch": 1.053941807343708, "percentage": 53.92, "elapsed_time": "22:44:05", "remaining_time": "19:25:30", "throughput": 333.83, "total_tokens": 27322624} {"current_steps": 21575, "total_steps": 40000, "loss": 0.0613, "lr": 0.1315039439263185, "epoch": 1.0541861090074023, "percentage": 53.94, "elapsed_time": "22:44:08", "remaining_time": "19:24:58", "throughput": 333.9, "total_tokens": 27328768} {"current_steps": 21580, "total_steps": 40000, "loss": 0.0497, "lr": 0.13144549002020833, "epoch": 1.0544304106710967, "percentage": 53.95, "elapsed_time": "22:44:11", "remaining_time": "19:24:25", "throughput": 333.96, "total_tokens": 27334688} {"current_steps": 21585, "total_steps": 40000, "loss": 0.0417, "lr": 0.13138703897543688, "epoch": 1.054674712334791, "percentage": 53.96, "elapsed_time": "22:44:14", "remaining_time": "19:23:53", "throughput": 334.02, "total_tokens": 27341088} {"current_steps": 21590, "total_steps": 40000, "loss": 0.0442, "lr": 0.1313285908010178, "epoch": 1.0549190139984854, "percentage": 53.97, "elapsed_time": "22:44:17", "remaining_time": "19:23:20", "throughput": 334.09, "total_tokens": 27347840} {"current_steps": 21595, "total_steps": 40000, "loss": 0.0873, "lr": 0.13127014550596475, "epoch": 1.0551633156621796, "percentage": 53.99, "elapsed_time": "22:44:20", "remaining_time": "19:22:48", "throughput": 334.16, "total_tokens": 27354240} {"current_steps": 21600, "total_steps": 40000, "loss": 0.0601, "lr": 0.1312117030992906, "epoch": 1.055407617325874, "percentage": 54.0, "elapsed_time": "22:44:24", "remaining_time": "19:22:16", "throughput": 334.23, "total_tokens": 27361312} {"current_steps": 21600, "total_steps": 40000, "eval_loss": 0.06503776460886002, "epoch": 1.055407617325874, "percentage": 54.0, "elapsed_time": "22:55:04", "remaining_time": "19:31:21", "throughput": 331.63, "total_tokens": 27361312} {"current_steps": 21605, "total_steps": 40000, "loss": 0.0646, "lr": 0.13115326359000795, "epoch": 1.0556519189895683, "percentage": 54.01, "elapsed_time": "22:55:08", "remaining_time": "19:30:49", "throughput": 331.7, "total_tokens": 27367968} {"current_steps": 21610, "total_steps": 40000, "loss": 0.0647, "lr": 0.13109482698712896, "epoch": 1.0558962206532627, "percentage": 54.02, "elapsed_time": "22:55:11", "remaining_time": "19:30:16", "throughput": 331.77, "total_tokens": 27374592} {"current_steps": 21615, "total_steps": 40000, "loss": 0.0601, "lr": 0.1310363932996651, "epoch": 1.0561405223169569, "percentage": 54.04, "elapsed_time": "22:55:14", "remaining_time": "19:29:44", "throughput": 331.83, "total_tokens": 27380640} {"current_steps": 21620, "total_steps": 40000, "loss": 0.0584, "lr": 0.13097796253662775, "epoch": 1.0563848239806513, "percentage": 54.05, "elapsed_time": "22:55:17", "remaining_time": "19:29:11", "throughput": 331.89, "total_tokens": 27386816} {"current_steps": 21625, "total_steps": 40000, "loss": 0.0656, "lr": 0.1309195347070277, "epoch": 1.0566291256443456, "percentage": 54.06, "elapsed_time": "22:55:20", "remaining_time": "19:28:38", "throughput": 331.96, "total_tokens": 27393824} {"current_steps": 21630, "total_steps": 40000, "loss": 0.0519, "lr": 0.13086110981987506, "epoch": 1.05687342730804, "percentage": 54.07, "elapsed_time": "22:55:24", "remaining_time": "19:28:06", "throughput": 332.03, "total_tokens": 27400320} {"current_steps": 21635, "total_steps": 40000, "loss": 0.0713, "lr": 0.13080268788417987, "epoch": 1.0571177289717344, "percentage": 54.09, "elapsed_time": "22:55:27", "remaining_time": "19:27:33", "throughput": 332.09, "total_tokens": 27406432} {"current_steps": 21640, "total_steps": 40000, "loss": 0.0394, "lr": 0.1307442689089515, "epoch": 1.0573620306354286, "percentage": 54.1, "elapsed_time": "22:55:30", "remaining_time": "19:27:00", "throughput": 332.15, "total_tokens": 27412736} {"current_steps": 21645, "total_steps": 40000, "loss": 0.0549, "lr": 0.13068585290319873, "epoch": 1.057606332299123, "percentage": 54.11, "elapsed_time": "22:55:33", "remaining_time": "19:26:28", "throughput": 332.23, "total_tokens": 27419744} {"current_steps": 21650, "total_steps": 40000, "loss": 0.0658, "lr": 0.13062743987593026, "epoch": 1.0578506339628173, "percentage": 54.12, "elapsed_time": "22:55:36", "remaining_time": "19:25:55", "throughput": 332.28, "total_tokens": 27425536} {"current_steps": 21655, "total_steps": 40000, "loss": 0.0567, "lr": 0.13056902983615395, "epoch": 1.0580949356265117, "percentage": 54.14, "elapsed_time": "22:55:39", "remaining_time": "19:25:23", "throughput": 332.35, "total_tokens": 27431904} {"current_steps": 21660, "total_steps": 40000, "loss": 0.0697, "lr": 0.13051062279287742, "epoch": 1.0583392372902058, "percentage": 54.15, "elapsed_time": "22:55:42", "remaining_time": "19:24:50", "throughput": 332.42, "total_tokens": 27438560} {"current_steps": 21665, "total_steps": 40000, "loss": 0.056, "lr": 0.13045221875510782, "epoch": 1.0585835389539002, "percentage": 54.16, "elapsed_time": "22:55:45", "remaining_time": "19:24:18", "throughput": 332.48, "total_tokens": 27444448} {"current_steps": 21670, "total_steps": 40000, "loss": 0.0482, "lr": 0.13039381773185174, "epoch": 1.0588278406175946, "percentage": 54.17, "elapsed_time": "22:55:48", "remaining_time": "19:23:45", "throughput": 332.54, "total_tokens": 27450848} {"current_steps": 21675, "total_steps": 40000, "loss": 0.08, "lr": 0.1303354197321153, "epoch": 1.059072142281289, "percentage": 54.19, "elapsed_time": "22:55:51", "remaining_time": "19:23:12", "throughput": 332.61, "total_tokens": 27457152} {"current_steps": 21680, "total_steps": 40000, "loss": 0.0565, "lr": 0.13027702476490433, "epoch": 1.0593164439449834, "percentage": 54.2, "elapsed_time": "22:55:54", "remaining_time": "19:22:40", "throughput": 332.67, "total_tokens": 27463552} {"current_steps": 21685, "total_steps": 40000, "loss": 0.0542, "lr": 0.1302186328392239, "epoch": 1.0595607456086775, "percentage": 54.21, "elapsed_time": "22:55:57", "remaining_time": "19:22:07", "throughput": 332.73, "total_tokens": 27469696} {"current_steps": 21690, "total_steps": 40000, "loss": 0.0327, "lr": 0.130160243964079, "epoch": 1.059805047272372, "percentage": 54.23, "elapsed_time": "22:56:01", "remaining_time": "19:21:35", "throughput": 332.8, "total_tokens": 27476544} {"current_steps": 21695, "total_steps": 40000, "loss": 0.072, "lr": 0.13010185814847372, "epoch": 1.0600493489360663, "percentage": 54.24, "elapsed_time": "22:56:04", "remaining_time": "19:21:02", "throughput": 332.87, "total_tokens": 27482848} {"current_steps": 21700, "total_steps": 40000, "loss": 0.0598, "lr": 0.13004347540141192, "epoch": 1.0602936505997607, "percentage": 54.25, "elapsed_time": "22:56:07", "remaining_time": "19:20:30", "throughput": 332.93, "total_tokens": 27489536} {"current_steps": 21705, "total_steps": 40000, "loss": 0.0532, "lr": 0.12998509573189712, "epoch": 1.0605379522634548, "percentage": 54.26, "elapsed_time": "22:56:10", "remaining_time": "19:19:58", "throughput": 333.0, "total_tokens": 27495680} {"current_steps": 21710, "total_steps": 40000, "loss": 0.0633, "lr": 0.12992671914893203, "epoch": 1.0607822539271492, "percentage": 54.27, "elapsed_time": "22:56:13", "remaining_time": "19:19:25", "throughput": 333.06, "total_tokens": 27501824} {"current_steps": 21715, "total_steps": 40000, "loss": 0.0372, "lr": 0.12986834566151909, "epoch": 1.0610265555908436, "percentage": 54.29, "elapsed_time": "22:56:16", "remaining_time": "19:18:53", "throughput": 333.13, "total_tokens": 27508736} {"current_steps": 21720, "total_steps": 40000, "loss": 0.0392, "lr": 0.12980997527866028, "epoch": 1.061270857254538, "percentage": 54.3, "elapsed_time": "22:56:19", "remaining_time": "19:18:20", "throughput": 333.2, "total_tokens": 27515552} {"current_steps": 21725, "total_steps": 40000, "loss": 0.0523, "lr": 0.12975160800935692, "epoch": 1.0615151589182323, "percentage": 54.31, "elapsed_time": "22:56:22", "remaining_time": "19:17:48", "throughput": 333.27, "total_tokens": 27522368} {"current_steps": 21730, "total_steps": 40000, "loss": 0.0735, "lr": 0.12969324386261016, "epoch": 1.0617594605819265, "percentage": 54.33, "elapsed_time": "22:56:26", "remaining_time": "19:17:16", "throughput": 333.33, "total_tokens": 27528448} {"current_steps": 21735, "total_steps": 40000, "loss": 0.0881, "lr": 0.12963488284742034, "epoch": 1.0620037622456209, "percentage": 54.34, "elapsed_time": "22:56:29", "remaining_time": "19:16:43", "throughput": 333.4, "total_tokens": 27534976} {"current_steps": 21740, "total_steps": 40000, "loss": 0.0293, "lr": 0.12957652497278752, "epoch": 1.0622480639093153, "percentage": 54.35, "elapsed_time": "22:56:32", "remaining_time": "19:16:11", "throughput": 333.46, "total_tokens": 27541472} {"current_steps": 21745, "total_steps": 40000, "loss": 0.0761, "lr": 0.12951817024771117, "epoch": 1.0624923655730096, "percentage": 54.36, "elapsed_time": "22:56:35", "remaining_time": "19:15:39", "throughput": 333.53, "total_tokens": 27547872} {"current_steps": 21750, "total_steps": 40000, "loss": 0.0506, "lr": 0.12945981868119041, "epoch": 1.0627366672367038, "percentage": 54.37, "elapsed_time": "22:56:38", "remaining_time": "19:15:06", "throughput": 333.59, "total_tokens": 27553952} {"current_steps": 21755, "total_steps": 40000, "loss": 0.0577, "lr": 0.12940147028222376, "epoch": 1.0629809689003982, "percentage": 54.39, "elapsed_time": "22:56:41", "remaining_time": "19:14:34", "throughput": 333.65, "total_tokens": 27560288} {"current_steps": 21760, "total_steps": 40000, "loss": 0.0918, "lr": 0.12934312505980916, "epoch": 1.0632252705640926, "percentage": 54.4, "elapsed_time": "22:56:44", "remaining_time": "19:14:02", "throughput": 333.72, "total_tokens": 27566560} {"current_steps": 21765, "total_steps": 40000, "loss": 0.051, "lr": 0.1292847830229443, "epoch": 1.063469572227787, "percentage": 54.41, "elapsed_time": "22:56:47", "remaining_time": "19:13:29", "throughput": 333.78, "total_tokens": 27572640} {"current_steps": 21770, "total_steps": 40000, "loss": 0.0875, "lr": 0.12922644418062626, "epoch": 1.0637138738914813, "percentage": 54.43, "elapsed_time": "22:56:50", "remaining_time": "19:12:57", "throughput": 333.84, "total_tokens": 27579040} {"current_steps": 21775, "total_steps": 40000, "loss": 0.0669, "lr": 0.1291681085418515, "epoch": 1.0639581755551755, "percentage": 54.44, "elapsed_time": "22:56:53", "remaining_time": "19:12:25", "throughput": 333.91, "total_tokens": 27585440} {"current_steps": 21780, "total_steps": 40000, "loss": 0.0769, "lr": 0.12910977611561628, "epoch": 1.0642024772188698, "percentage": 54.45, "elapsed_time": "22:56:56", "remaining_time": "19:11:52", "throughput": 333.98, "total_tokens": 27592000} {"current_steps": 21785, "total_steps": 40000, "loss": 0.0514, "lr": 0.1290514469109161, "epoch": 1.0644467788825642, "percentage": 54.46, "elapsed_time": "22:56:59", "remaining_time": "19:11:20", "throughput": 334.03, "total_tokens": 27597952} {"current_steps": 21790, "total_steps": 40000, "loss": 0.0587, "lr": 0.128993120936746, "epoch": 1.0646910805462586, "percentage": 54.47, "elapsed_time": "22:57:03", "remaining_time": "19:10:48", "throughput": 334.1, "total_tokens": 27604096} {"current_steps": 21795, "total_steps": 40000, "loss": 0.0769, "lr": 0.12893479820210071, "epoch": 1.0649353822099528, "percentage": 54.49, "elapsed_time": "22:57:06", "remaining_time": "19:10:16", "throughput": 334.16, "total_tokens": 27610432} {"current_steps": 21800, "total_steps": 40000, "loss": 0.0791, "lr": 0.1288764787159742, "epoch": 1.0651796838736471, "percentage": 54.5, "elapsed_time": "22:57:09", "remaining_time": "19:09:43", "throughput": 334.22, "total_tokens": 27616640} {"current_steps": 21800, "total_steps": 40000, "eval_loss": 0.0645691305398941, "epoch": 1.0651796838736471, "percentage": 54.5, "elapsed_time": "23:07:49", "remaining_time": "19:18:38", "throughput": 331.65, "total_tokens": 27616640} {"current_steps": 21805, "total_steps": 40000, "loss": 0.0651, "lr": 0.1288181624873601, "epoch": 1.0654239855373415, "percentage": 54.51, "elapsed_time": "23:07:53", "remaining_time": "19:18:06", "throughput": 331.72, "total_tokens": 27623456} {"current_steps": 21810, "total_steps": 40000, "loss": 0.0628, "lr": 0.12875984952525163, "epoch": 1.065668287201036, "percentage": 54.52, "elapsed_time": "23:07:56", "remaining_time": "19:17:34", "throughput": 331.78, "total_tokens": 27629536} {"current_steps": 21815, "total_steps": 40000, "loss": 0.057, "lr": 0.12870153983864122, "epoch": 1.0659125888647303, "percentage": 54.54, "elapsed_time": "23:07:59", "remaining_time": "19:17:01", "throughput": 331.84, "total_tokens": 27635680} {"current_steps": 21820, "total_steps": 40000, "loss": 0.0634, "lr": 0.12864323343652104, "epoch": 1.0661568905284244, "percentage": 54.55, "elapsed_time": "23:08:02", "remaining_time": "19:16:29", "throughput": 331.91, "total_tokens": 27642112} {"current_steps": 21825, "total_steps": 40000, "loss": 0.0708, "lr": 0.12858493032788268, "epoch": 1.0664011921921188, "percentage": 54.56, "elapsed_time": "23:08:05", "remaining_time": "19:15:56", "throughput": 331.98, "total_tokens": 27648800} {"current_steps": 21830, "total_steps": 40000, "loss": 0.0539, "lr": 0.12852663052171714, "epoch": 1.0666454938558132, "percentage": 54.57, "elapsed_time": "23:08:08", "remaining_time": "19:15:24", "throughput": 332.04, "total_tokens": 27654880} {"current_steps": 21835, "total_steps": 40000, "loss": 0.0615, "lr": 0.12846833402701507, "epoch": 1.0668897955195076, "percentage": 54.59, "elapsed_time": "23:08:11", "remaining_time": "19:14:52", "throughput": 332.1, "total_tokens": 27661088} {"current_steps": 21840, "total_steps": 40000, "loss": 0.0522, "lr": 0.12841004085276642, "epoch": 1.0671340971832017, "percentage": 54.6, "elapsed_time": "23:08:14", "remaining_time": "19:14:19", "throughput": 332.17, "total_tokens": 27667712} {"current_steps": 21845, "total_steps": 40000, "loss": 0.041, "lr": 0.12835175100796076, "epoch": 1.0673783988468961, "percentage": 54.61, "elapsed_time": "23:08:17", "remaining_time": "19:13:47", "throughput": 332.23, "total_tokens": 27674240} {"current_steps": 21850, "total_steps": 40000, "loss": 0.0777, "lr": 0.12829346450158724, "epoch": 1.0676227005105905, "percentage": 54.62, "elapsed_time": "23:08:20", "remaining_time": "19:13:15", "throughput": 332.29, "total_tokens": 27680320} {"current_steps": 21855, "total_steps": 40000, "loss": 0.0679, "lr": 0.12823518134263423, "epoch": 1.0678670021742849, "percentage": 54.64, "elapsed_time": "23:08:24", "remaining_time": "19:12:42", "throughput": 332.36, "total_tokens": 27687232} {"current_steps": 21860, "total_steps": 40000, "loss": 0.058, "lr": 0.12817690154008973, "epoch": 1.0681113038379793, "percentage": 54.65, "elapsed_time": "23:08:27", "remaining_time": "19:12:10", "throughput": 332.43, "total_tokens": 27693888} {"current_steps": 21865, "total_steps": 40000, "loss": 0.0474, "lr": 0.12811862510294134, "epoch": 1.0683556055016734, "percentage": 54.66, "elapsed_time": "23:08:30", "remaining_time": "19:11:38", "throughput": 332.49, "total_tokens": 27699936} {"current_steps": 21870, "total_steps": 40000, "loss": 0.0464, "lr": 0.12806035204017585, "epoch": 1.0685999071653678, "percentage": 54.67, "elapsed_time": "23:08:33", "remaining_time": "19:11:05", "throughput": 332.55, "total_tokens": 27705824} {"current_steps": 21875, "total_steps": 40000, "loss": 0.0512, "lr": 0.12800208236077987, "epoch": 1.0688442088290622, "percentage": 54.69, "elapsed_time": "23:08:36", "remaining_time": "19:10:33", "throughput": 332.61, "total_tokens": 27712128} {"current_steps": 21880, "total_steps": 40000, "loss": 0.0604, "lr": 0.12794381607373917, "epoch": 1.0690885104927565, "percentage": 54.7, "elapsed_time": "23:08:39", "remaining_time": "19:10:01", "throughput": 332.68, "total_tokens": 27718496} {"current_steps": 21885, "total_steps": 40000, "loss": 0.0686, "lr": 0.12788555318803924, "epoch": 1.0693328121564507, "percentage": 54.71, "elapsed_time": "23:08:42", "remaining_time": "19:09:29", "throughput": 332.75, "total_tokens": 27725216} {"current_steps": 21890, "total_steps": 40000, "loss": 0.064, "lr": 0.1278272937126649, "epoch": 1.069577113820145, "percentage": 54.73, "elapsed_time": "23:08:45", "remaining_time": "19:08:56", "throughput": 332.81, "total_tokens": 27731456} {"current_steps": 21895, "total_steps": 40000, "loss": 0.0467, "lr": 0.1277690376566005, "epoch": 1.0698214154838395, "percentage": 54.74, "elapsed_time": "23:08:48", "remaining_time": "19:08:24", "throughput": 332.87, "total_tokens": 27737920} {"current_steps": 21900, "total_steps": 40000, "loss": 0.064, "lr": 0.12771078502882985, "epoch": 1.0700657171475338, "percentage": 54.75, "elapsed_time": "23:08:52", "remaining_time": "19:07:52", "throughput": 332.94, "total_tokens": 27744736} {"current_steps": 21905, "total_steps": 40000, "loss": 0.0553, "lr": 0.12765253583833633, "epoch": 1.070310018811228, "percentage": 54.76, "elapsed_time": "23:08:55", "remaining_time": "19:07:20", "throughput": 333.01, "total_tokens": 27751136} {"current_steps": 21910, "total_steps": 40000, "loss": 0.0714, "lr": 0.12759429009410256, "epoch": 1.0705543204749224, "percentage": 54.77, "elapsed_time": "23:08:58", "remaining_time": "19:06:48", "throughput": 333.07, "total_tokens": 27757408} {"current_steps": 21915, "total_steps": 40000, "loss": 0.0721, "lr": 0.12753604780511085, "epoch": 1.0707986221386168, "percentage": 54.79, "elapsed_time": "23:09:01", "remaining_time": "19:06:16", "throughput": 333.13, "total_tokens": 27763488} {"current_steps": 21920, "total_steps": 40000, "loss": 0.0761, "lr": 0.12747780898034283, "epoch": 1.0710429238023111, "percentage": 54.8, "elapsed_time": "23:09:04", "remaining_time": "19:05:43", "throughput": 333.2, "total_tokens": 27770304} {"current_steps": 21925, "total_steps": 40000, "loss": 0.0747, "lr": 0.12741957362877973, "epoch": 1.0712872254660055, "percentage": 54.81, "elapsed_time": "23:09:07", "remaining_time": "19:05:11", "throughput": 333.26, "total_tokens": 27776512} {"current_steps": 21930, "total_steps": 40000, "loss": 0.0708, "lr": 0.12736134175940214, "epoch": 1.0715315271296997, "percentage": 54.83, "elapsed_time": "23:09:10", "remaining_time": "19:04:39", "throughput": 333.33, "total_tokens": 27783072} {"current_steps": 21935, "total_steps": 40000, "loss": 0.0527, "lr": 0.12730311338119016, "epoch": 1.071775828793394, "percentage": 54.84, "elapsed_time": "23:09:13", "remaining_time": "19:04:07", "throughput": 333.4, "total_tokens": 27789760} {"current_steps": 21940, "total_steps": 40000, "loss": 0.0423, "lr": 0.12724488850312327, "epoch": 1.0720201304570884, "percentage": 54.85, "elapsed_time": "23:09:16", "remaining_time": "19:03:35", "throughput": 333.46, "total_tokens": 27796032} {"current_steps": 21945, "total_steps": 40000, "loss": 0.0584, "lr": 0.1271866671341806, "epoch": 1.0722644321207828, "percentage": 54.86, "elapsed_time": "23:09:20", "remaining_time": "19:03:03", "throughput": 333.52, "total_tokens": 27802560} {"current_steps": 21950, "total_steps": 40000, "loss": 0.0501, "lr": 0.12712844928334047, "epoch": 1.072508733784477, "percentage": 54.87, "elapsed_time": "23:09:23", "remaining_time": "19:02:31", "throughput": 333.59, "total_tokens": 27809184} {"current_steps": 21955, "total_steps": 40000, "loss": 0.0762, "lr": 0.12707023495958095, "epoch": 1.0727530354481714, "percentage": 54.89, "elapsed_time": "23:09:26", "remaining_time": "19:01:59", "throughput": 333.66, "total_tokens": 27815616} {"current_steps": 21960, "total_steps": 40000, "loss": 0.0683, "lr": 0.12701202417187932, "epoch": 1.0729973371118657, "percentage": 54.9, "elapsed_time": "23:09:29", "remaining_time": "19:01:27", "throughput": 333.72, "total_tokens": 27822208} {"current_steps": 21965, "total_steps": 40000, "loss": 0.0565, "lr": 0.12695381692921243, "epoch": 1.0732416387755601, "percentage": 54.91, "elapsed_time": "23:09:32", "remaining_time": "19:00:55", "throughput": 333.78, "total_tokens": 27828096} {"current_steps": 21970, "total_steps": 40000, "loss": 0.0812, "lr": 0.12689561324055665, "epoch": 1.0734859404392545, "percentage": 54.93, "elapsed_time": "23:09:35", "remaining_time": "19:00:23", "throughput": 333.85, "total_tokens": 27835008} {"current_steps": 21975, "total_steps": 40000, "loss": 0.0685, "lr": 0.12683741311488758, "epoch": 1.0737302421029487, "percentage": 54.94, "elapsed_time": "23:09:38", "remaining_time": "18:59:51", "throughput": 333.91, "total_tokens": 27841056} {"current_steps": 21980, "total_steps": 40000, "loss": 0.0388, "lr": 0.1267792165611805, "epoch": 1.073974543766643, "percentage": 54.95, "elapsed_time": "23:09:42", "remaining_time": "18:59:19", "throughput": 333.98, "total_tokens": 27847904} {"current_steps": 21985, "total_steps": 40000, "loss": 0.0415, "lr": 0.1267210235884101, "epoch": 1.0742188454303374, "percentage": 54.96, "elapsed_time": "23:09:45", "remaining_time": "18:58:47", "throughput": 334.05, "total_tokens": 27854656} {"current_steps": 21990, "total_steps": 40000, "loss": 0.0474, "lr": 0.12666283420555033, "epoch": 1.0744631470940318, "percentage": 54.97, "elapsed_time": "23:09:48", "remaining_time": "18:58:15", "throughput": 334.12, "total_tokens": 27861376} {"current_steps": 21995, "total_steps": 40000, "loss": 0.0688, "lr": 0.12660464842157487, "epoch": 1.074707448757726, "percentage": 54.99, "elapsed_time": "23:09:51", "remaining_time": "18:57:43", "throughput": 334.18, "total_tokens": 27867616} {"current_steps": 22000, "total_steps": 40000, "loss": 0.0295, "lr": 0.1265464662454566, "epoch": 1.0749517504214203, "percentage": 55.0, "elapsed_time": "23:09:54", "remaining_time": "18:57:12", "throughput": 334.25, "total_tokens": 27874656} {"current_steps": 22000, "total_steps": 40000, "eval_loss": 0.0643293485045433, "epoch": 1.0749517504214203, "percentage": 55.0, "elapsed_time": "23:20:35", "remaining_time": "19:05:55", "throughput": 331.7, "total_tokens": 27874656} {"current_steps": 22005, "total_steps": 40000, "loss": 0.0455, "lr": 0.12648828768616793, "epoch": 1.0751960520851147, "percentage": 55.01, "elapsed_time": "23:20:38", "remaining_time": "19:05:24", "throughput": 331.76, "total_tokens": 27881024} {"current_steps": 22010, "total_steps": 40000, "loss": 0.0914, "lr": 0.12643011275268085, "epoch": 1.075440353748809, "percentage": 55.02, "elapsed_time": "23:20:42", "remaining_time": "19:04:52", "throughput": 331.83, "total_tokens": 27887616} {"current_steps": 22015, "total_steps": 40000, "loss": 0.0394, "lr": 0.1263719414539665, "epoch": 1.0756846554125032, "percentage": 55.04, "elapsed_time": "23:20:45", "remaining_time": "19:04:20", "throughput": 331.89, "total_tokens": 27893344} {"current_steps": 22020, "total_steps": 40000, "loss": 0.0515, "lr": 0.1263137737989957, "epoch": 1.0759289570761976, "percentage": 55.05, "elapsed_time": "23:20:48", "remaining_time": "19:03:47", "throughput": 331.94, "total_tokens": 27899168} {"current_steps": 22025, "total_steps": 40000, "loss": 0.0482, "lr": 0.1262556097967387, "epoch": 1.076173258739892, "percentage": 55.06, "elapsed_time": "23:20:51", "remaining_time": "19:03:15", "throughput": 332.01, "total_tokens": 27905536} {"current_steps": 22030, "total_steps": 40000, "loss": 0.0829, "lr": 0.126197449456165, "epoch": 1.0764175604035864, "percentage": 55.07, "elapsed_time": "23:20:54", "remaining_time": "19:02:43", "throughput": 332.07, "total_tokens": 27911968} {"current_steps": 22035, "total_steps": 40000, "loss": 0.042, "lr": 0.12613929278624378, "epoch": 1.0766618620672808, "percentage": 55.09, "elapsed_time": "23:20:57", "remaining_time": "19:02:11", "throughput": 332.14, "total_tokens": 27918528} {"current_steps": 22040, "total_steps": 40000, "loss": 0.0621, "lr": 0.12608113979594343, "epoch": 1.076906163730975, "percentage": 55.1, "elapsed_time": "23:21:00", "remaining_time": "19:01:39", "throughput": 332.2, "total_tokens": 27924736} {"current_steps": 22045, "total_steps": 40000, "loss": 0.0695, "lr": 0.1260229904942319, "epoch": 1.0771504653946693, "percentage": 55.11, "elapsed_time": "23:21:03", "remaining_time": "19:01:07", "throughput": 332.26, "total_tokens": 27931040} {"current_steps": 22050, "total_steps": 40000, "loss": 0.0404, "lr": 0.12596484489007662, "epoch": 1.0773947670583637, "percentage": 55.12, "elapsed_time": "23:21:06", "remaining_time": "19:00:35", "throughput": 332.32, "total_tokens": 27936928} {"current_steps": 22055, "total_steps": 40000, "loss": 0.0464, "lr": 0.1259067029924442, "epoch": 1.077639068722058, "percentage": 55.14, "elapsed_time": "23:21:09", "remaining_time": "19:00:03", "throughput": 332.38, "total_tokens": 27942976} {"current_steps": 22060, "total_steps": 40000, "loss": 0.0747, "lr": 0.12584856481030096, "epoch": 1.0778833703857522, "percentage": 55.15, "elapsed_time": "23:21:12", "remaining_time": "18:59:30", "throughput": 332.44, "total_tokens": 27949056} {"current_steps": 22065, "total_steps": 40000, "loss": 0.0441, "lr": 0.12579043035261261, "epoch": 1.0781276720494466, "percentage": 55.16, "elapsed_time": "23:21:15", "remaining_time": "18:58:59", "throughput": 332.51, "total_tokens": 27955968} {"current_steps": 22070, "total_steps": 40000, "loss": 0.0715, "lr": 0.1257322996283441, "epoch": 1.078371973713141, "percentage": 55.17, "elapsed_time": "23:21:18", "remaining_time": "18:58:26", "throughput": 332.57, "total_tokens": 27961792} {"current_steps": 22075, "total_steps": 40000, "loss": 0.0403, "lr": 0.12567417264645994, "epoch": 1.0786162753768354, "percentage": 55.19, "elapsed_time": "23:21:22", "remaining_time": "18:57:54", "throughput": 332.63, "total_tokens": 27968128} {"current_steps": 22080, "total_steps": 40000, "loss": 0.0944, "lr": 0.12561604941592408, "epoch": 1.0788605770405297, "percentage": 55.2, "elapsed_time": "23:21:25", "remaining_time": "18:57:22", "throughput": 332.69, "total_tokens": 27974176} {"current_steps": 22085, "total_steps": 40000, "loss": 0.0796, "lr": 0.12555792994569978, "epoch": 1.079104878704224, "percentage": 55.21, "elapsed_time": "23:21:28", "remaining_time": "18:56:51", "throughput": 332.75, "total_tokens": 27980544} {"current_steps": 22090, "total_steps": 40000, "loss": 0.0682, "lr": 0.1254998142447499, "epoch": 1.0793491803679183, "percentage": 55.23, "elapsed_time": "23:21:31", "remaining_time": "18:56:18", "throughput": 332.81, "total_tokens": 27986208} {"current_steps": 22095, "total_steps": 40000, "loss": 0.1162, "lr": 0.1254417023220365, "epoch": 1.0795934820316127, "percentage": 55.24, "elapsed_time": "23:21:34", "remaining_time": "18:55:46", "throughput": 332.87, "total_tokens": 27992032} {"current_steps": 22100, "total_steps": 40000, "loss": 0.0613, "lr": 0.12538359418652126, "epoch": 1.079837783695307, "percentage": 55.25, "elapsed_time": "23:21:37", "remaining_time": "18:55:14", "throughput": 332.93, "total_tokens": 27998400} {"current_steps": 22105, "total_steps": 40000, "loss": 0.0544, "lr": 0.12532548984716513, "epoch": 1.0800820853590012, "percentage": 55.26, "elapsed_time": "23:21:40", "remaining_time": "18:54:42", "throughput": 332.99, "total_tokens": 28004704} {"current_steps": 22110, "total_steps": 40000, "loss": 0.0517, "lr": 0.12526738931292855, "epoch": 1.0803263870226956, "percentage": 55.27, "elapsed_time": "23:21:43", "remaining_time": "18:54:11", "throughput": 333.06, "total_tokens": 28011104} {"current_steps": 22115, "total_steps": 40000, "loss": 0.0857, "lr": 0.1252092925927714, "epoch": 1.08057068868639, "percentage": 55.29, "elapsed_time": "23:21:46", "remaining_time": "18:53:39", "throughput": 333.12, "total_tokens": 28017568} {"current_steps": 22120, "total_steps": 40000, "loss": 0.048, "lr": 0.12515119969565278, "epoch": 1.0808149903500843, "percentage": 55.3, "elapsed_time": "23:21:49", "remaining_time": "18:53:07", "throughput": 333.18, "total_tokens": 28023552} {"current_steps": 22125, "total_steps": 40000, "loss": 0.0689, "lr": 0.12509311063053144, "epoch": 1.0810592920137787, "percentage": 55.31, "elapsed_time": "23:21:52", "remaining_time": "18:52:35", "throughput": 333.24, "total_tokens": 28029312} {"current_steps": 22130, "total_steps": 40000, "loss": 0.0469, "lr": 0.1250350254063655, "epoch": 1.0813035936774729, "percentage": 55.33, "elapsed_time": "23:21:55", "remaining_time": "18:52:03", "throughput": 333.3, "total_tokens": 28035616} {"current_steps": 22135, "total_steps": 40000, "loss": 0.0447, "lr": 0.1249769440321123, "epoch": 1.0815478953411672, "percentage": 55.34, "elapsed_time": "23:21:58", "remaining_time": "18:51:31", "throughput": 333.36, "total_tokens": 28041696} {"current_steps": 22140, "total_steps": 40000, "loss": 0.0661, "lr": 0.12491886651672884, "epoch": 1.0817921970048616, "percentage": 55.35, "elapsed_time": "23:22:01", "remaining_time": "18:50:59", "throughput": 333.42, "total_tokens": 28047968} {"current_steps": 22145, "total_steps": 40000, "loss": 0.0823, "lr": 0.12486079286917139, "epoch": 1.082036498668556, "percentage": 55.36, "elapsed_time": "23:22:04", "remaining_time": "18:50:27", "throughput": 333.48, "total_tokens": 28053856} {"current_steps": 22150, "total_steps": 40000, "loss": 0.0739, "lr": 0.12480272309839553, "epoch": 1.0822808003322502, "percentage": 55.38, "elapsed_time": "23:22:07", "remaining_time": "18:49:55", "throughput": 333.54, "total_tokens": 28059904} {"current_steps": 22155, "total_steps": 40000, "loss": 0.0724, "lr": 0.12474465721335648, "epoch": 1.0825251019959445, "percentage": 55.39, "elapsed_time": "23:22:10", "remaining_time": "18:49:24", "throughput": 333.6, "total_tokens": 28065920} {"current_steps": 22160, "total_steps": 40000, "loss": 0.0408, "lr": 0.12468659522300861, "epoch": 1.082769403659639, "percentage": 55.4, "elapsed_time": "23:22:13", "remaining_time": "18:48:52", "throughput": 333.67, "total_tokens": 28072928} {"current_steps": 22165, "total_steps": 40000, "loss": 0.0473, "lr": 0.12462853713630584, "epoch": 1.0830137053233333, "percentage": 55.41, "elapsed_time": "23:22:17", "remaining_time": "18:48:20", "throughput": 333.73, "total_tokens": 28079200} {"current_steps": 22170, "total_steps": 40000, "loss": 0.0731, "lr": 0.12457048296220156, "epoch": 1.0832580069870277, "percentage": 55.43, "elapsed_time": "23:22:20", "remaining_time": "18:47:48", "throughput": 333.79, "total_tokens": 28085184} {"current_steps": 22175, "total_steps": 40000, "loss": 0.0641, "lr": 0.12451243270964832, "epoch": 1.0835023086507218, "percentage": 55.44, "elapsed_time": "23:22:23", "remaining_time": "18:47:17", "throughput": 333.85, "total_tokens": 28091616} {"current_steps": 22180, "total_steps": 40000, "loss": 0.064, "lr": 0.12445438638759827, "epoch": 1.0837466103144162, "percentage": 55.45, "elapsed_time": "23:22:26", "remaining_time": "18:46:45", "throughput": 333.92, "total_tokens": 28097824} {"current_steps": 22185, "total_steps": 40000, "loss": 0.0655, "lr": 0.1243963440050029, "epoch": 1.0839909119781106, "percentage": 55.46, "elapsed_time": "23:22:29", "remaining_time": "18:46:13", "throughput": 333.98, "total_tokens": 28103904} {"current_steps": 22190, "total_steps": 40000, "loss": 0.0343, "lr": 0.12433830557081298, "epoch": 1.084235213641805, "percentage": 55.47, "elapsed_time": "23:22:32", "remaining_time": "18:45:41", "throughput": 334.04, "total_tokens": 28110432} {"current_steps": 22195, "total_steps": 40000, "loss": 0.0621, "lr": 0.12428027109397889, "epoch": 1.0844795153054991, "percentage": 55.49, "elapsed_time": "23:22:35", "remaining_time": "18:45:10", "throughput": 334.1, "total_tokens": 28116576} {"current_steps": 22200, "total_steps": 40000, "loss": 0.0573, "lr": 0.12422224058345015, "epoch": 1.0847238169691935, "percentage": 55.5, "elapsed_time": "23:22:38", "remaining_time": "18:44:38", "throughput": 334.16, "total_tokens": 28122656} {"current_steps": 22200, "total_steps": 40000, "eval_loss": 0.06396724283695221, "epoch": 1.0847238169691935, "percentage": 55.5, "elapsed_time": "23:33:19", "remaining_time": "18:53:12", "throughput": 331.64, "total_tokens": 28122656} {"current_steps": 22205, "total_steps": 40000, "loss": 0.0542, "lr": 0.12416421404817583, "epoch": 1.084968118632888, "percentage": 55.51, "elapsed_time": "23:33:22", "remaining_time": "18:52:40", "throughput": 331.7, "total_tokens": 28129184} {"current_steps": 22210, "total_steps": 40000, "loss": 0.0886, "lr": 0.12410619149710447, "epoch": 1.0852124202965823, "percentage": 55.53, "elapsed_time": "23:33:26", "remaining_time": "18:52:08", "throughput": 331.77, "total_tokens": 28135840} {"current_steps": 22215, "total_steps": 40000, "loss": 0.091, "lr": 0.12404817293918374, "epoch": 1.0854567219602766, "percentage": 55.54, "elapsed_time": "23:33:29", "remaining_time": "18:51:37", "throughput": 331.83, "total_tokens": 28142304} {"current_steps": 22220, "total_steps": 40000, "loss": 0.0425, "lr": 0.12399015838336086, "epoch": 1.0857010236239708, "percentage": 55.55, "elapsed_time": "23:33:32", "remaining_time": "18:51:05", "throughput": 331.9, "total_tokens": 28148960} {"current_steps": 22225, "total_steps": 40000, "loss": 0.0602, "lr": 0.12393214783858246, "epoch": 1.0859453252876652, "percentage": 55.56, "elapsed_time": "23:33:35", "remaining_time": "18:50:33", "throughput": 331.96, "total_tokens": 28155264} {"current_steps": 22230, "total_steps": 40000, "loss": 0.0833, "lr": 0.1238741413137944, "epoch": 1.0861896269513596, "percentage": 55.57, "elapsed_time": "23:33:38", "remaining_time": "18:50:01", "throughput": 332.02, "total_tokens": 28161600} {"current_steps": 22235, "total_steps": 40000, "loss": 0.0751, "lr": 0.12381613881794212, "epoch": 1.086433928615054, "percentage": 55.59, "elapsed_time": "23:33:41", "remaining_time": "18:49:29", "throughput": 332.08, "total_tokens": 28167456} {"current_steps": 22240, "total_steps": 40000, "loss": 0.0358, "lr": 0.12375814035997022, "epoch": 1.086678230278748, "percentage": 55.6, "elapsed_time": "23:33:44", "remaining_time": "18:48:57", "throughput": 332.14, "total_tokens": 28173312} {"current_steps": 22245, "total_steps": 40000, "loss": 0.0658, "lr": 0.12370014594882285, "epoch": 1.0869225319424425, "percentage": 55.61, "elapsed_time": "23:33:47", "remaining_time": "18:48:25", "throughput": 332.2, "total_tokens": 28179648} {"current_steps": 22250, "total_steps": 40000, "loss": 0.0713, "lr": 0.12364215559344356, "epoch": 1.0871668336061369, "percentage": 55.62, "elapsed_time": "23:33:50", "remaining_time": "18:47:53", "throughput": 332.26, "total_tokens": 28185696} {"current_steps": 22255, "total_steps": 40000, "loss": 0.1015, "lr": 0.12358416930277506, "epoch": 1.0874111352698312, "percentage": 55.64, "elapsed_time": "23:33:53", "remaining_time": "18:47:22", "throughput": 332.32, "total_tokens": 28192064} {"current_steps": 22260, "total_steps": 40000, "loss": 0.0579, "lr": 0.1235261870857596, "epoch": 1.0876554369335256, "percentage": 55.65, "elapsed_time": "23:33:56", "remaining_time": "18:46:50", "throughput": 332.39, "total_tokens": 28199296} {"current_steps": 22265, "total_steps": 40000, "loss": 0.0452, "lr": 0.12346820895133884, "epoch": 1.0878997385972198, "percentage": 55.66, "elapsed_time": "23:34:00", "remaining_time": "18:46:18", "throughput": 332.46, "total_tokens": 28205888} {"current_steps": 22270, "total_steps": 40000, "loss": 0.0658, "lr": 0.12341023490845361, "epoch": 1.0881440402609142, "percentage": 55.67, "elapsed_time": "23:34:03", "remaining_time": "18:45:47", "throughput": 332.53, "total_tokens": 28212544} {"current_steps": 22275, "total_steps": 40000, "loss": 0.0521, "lr": 0.12335226496604437, "epoch": 1.0883883419246085, "percentage": 55.69, "elapsed_time": "23:34:06", "remaining_time": "18:45:15", "throughput": 332.59, "total_tokens": 28219104} {"current_steps": 22280, "total_steps": 40000, "loss": 0.0458, "lr": 0.12329429913305069, "epoch": 1.088632643588303, "percentage": 55.7, "elapsed_time": "23:34:09", "remaining_time": "18:44:43", "throughput": 332.65, "total_tokens": 28225408} {"current_steps": 22285, "total_steps": 40000, "loss": 0.0535, "lr": 0.12323633741841171, "epoch": 1.088876945251997, "percentage": 55.71, "elapsed_time": "23:34:12", "remaining_time": "18:44:11", "throughput": 332.72, "total_tokens": 28232128} {"current_steps": 22290, "total_steps": 40000, "loss": 0.0632, "lr": 0.12317837983106583, "epoch": 1.0891212469156915, "percentage": 55.73, "elapsed_time": "23:34:15", "remaining_time": "18:43:40", "throughput": 332.78, "total_tokens": 28238240} {"current_steps": 22295, "total_steps": 40000, "loss": 0.0636, "lr": 0.12312042637995087, "epoch": 1.0893655485793858, "percentage": 55.74, "elapsed_time": "23:34:18", "remaining_time": "18:43:08", "throughput": 332.84, "total_tokens": 28244544} {"current_steps": 22300, "total_steps": 40000, "loss": 0.0787, "lr": 0.12306247707400389, "epoch": 1.0896098502430802, "percentage": 55.75, "elapsed_time": "23:34:22", "remaining_time": "18:42:36", "throughput": 332.91, "total_tokens": 28251136} {"current_steps": 22305, "total_steps": 40000, "loss": 0.0438, "lr": 0.12300453192216154, "epoch": 1.0898541519067746, "percentage": 55.76, "elapsed_time": "23:34:25", "remaining_time": "18:42:05", "throughput": 332.96, "total_tokens": 28257120} {"current_steps": 22310, "total_steps": 40000, "loss": 0.0513, "lr": 0.12294659093335956, "epoch": 1.0900984535704688, "percentage": 55.77, "elapsed_time": "23:34:28", "remaining_time": "18:41:33", "throughput": 333.03, "total_tokens": 28263360} {"current_steps": 22315, "total_steps": 40000, "loss": 0.0673, "lr": 0.12288865411653327, "epoch": 1.0903427552341631, "percentage": 55.79, "elapsed_time": "23:34:31", "remaining_time": "18:41:01", "throughput": 333.09, "total_tokens": 28269472} {"current_steps": 22320, "total_steps": 40000, "loss": 0.0631, "lr": 0.12283072148061717, "epoch": 1.0905870568978575, "percentage": 55.8, "elapsed_time": "23:34:34", "remaining_time": "18:40:30", "throughput": 333.14, "total_tokens": 28275456} {"current_steps": 22325, "total_steps": 40000, "loss": 0.0893, "lr": 0.12277279303454529, "epoch": 1.090831358561552, "percentage": 55.81, "elapsed_time": "23:34:37", "remaining_time": "18:39:58", "throughput": 333.2, "total_tokens": 28281504} {"current_steps": 22330, "total_steps": 40000, "loss": 0.0503, "lr": 0.12271486878725091, "epoch": 1.091075660225246, "percentage": 55.83, "elapsed_time": "23:34:40", "remaining_time": "18:39:26", "throughput": 333.27, "total_tokens": 28288000} {"current_steps": 22335, "total_steps": 40000, "loss": 0.0417, "lr": 0.12265694874766658, "epoch": 1.0913199618889404, "percentage": 55.84, "elapsed_time": "23:34:43", "remaining_time": "18:38:55", "throughput": 333.33, "total_tokens": 28294304} {"current_steps": 22340, "total_steps": 40000, "loss": 0.0791, "lr": 0.12259903292472435, "epoch": 1.0915642635526348, "percentage": 55.85, "elapsed_time": "23:34:46", "remaining_time": "18:38:23", "throughput": 333.39, "total_tokens": 28300544} {"current_steps": 22345, "total_steps": 40000, "loss": 0.0466, "lr": 0.12254112132735567, "epoch": 1.0918085652163292, "percentage": 55.86, "elapsed_time": "23:34:49", "remaining_time": "18:37:52", "throughput": 333.45, "total_tokens": 28306848} {"current_steps": 22350, "total_steps": 40000, "loss": 0.0542, "lr": 0.12248321396449108, "epoch": 1.0920528668800236, "percentage": 55.88, "elapsed_time": "23:34:52", "remaining_time": "18:37:20", "throughput": 333.52, "total_tokens": 28313120} {"current_steps": 22355, "total_steps": 40000, "loss": 0.056, "lr": 0.12242531084506075, "epoch": 1.0922971685437177, "percentage": 55.89, "elapsed_time": "23:34:55", "remaining_time": "18:36:49", "throughput": 333.58, "total_tokens": 28319904} {"current_steps": 22360, "total_steps": 40000, "loss": 0.0322, "lr": 0.122367411977994, "epoch": 1.092541470207412, "percentage": 55.9, "elapsed_time": "23:34:59", "remaining_time": "18:36:17", "throughput": 333.65, "total_tokens": 28326464} {"current_steps": 22365, "total_steps": 40000, "loss": 0.0431, "lr": 0.12230951737221954, "epoch": 1.0927857718711065, "percentage": 55.91, "elapsed_time": "23:35:02", "remaining_time": "18:35:46", "throughput": 333.71, "total_tokens": 28332992} {"current_steps": 22370, "total_steps": 40000, "loss": 0.062, "lr": 0.12225162703666555, "epoch": 1.0930300735348009, "percentage": 55.93, "elapsed_time": "23:35:05", "remaining_time": "18:35:14", "throughput": 333.78, "total_tokens": 28339424} {"current_steps": 22375, "total_steps": 40000, "loss": 0.0888, "lr": 0.1221937409802593, "epoch": 1.093274375198495, "percentage": 55.94, "elapsed_time": "23:35:08", "remaining_time": "18:34:43", "throughput": 333.84, "total_tokens": 28345696} {"current_steps": 22380, "total_steps": 40000, "loss": 0.0468, "lr": 0.12213585921192768, "epoch": 1.0935186768621894, "percentage": 55.95, "elapsed_time": "23:35:11", "remaining_time": "18:34:11", "throughput": 333.9, "total_tokens": 28352064} {"current_steps": 22385, "total_steps": 40000, "loss": 0.0394, "lr": 0.1220779817405967, "epoch": 1.0937629785258838, "percentage": 55.96, "elapsed_time": "23:35:14", "remaining_time": "18:33:40", "throughput": 333.96, "total_tokens": 28357856} {"current_steps": 22390, "total_steps": 40000, "loss": 0.054, "lr": 0.12202010857519181, "epoch": 1.0940072801895782, "percentage": 55.97, "elapsed_time": "23:35:17", "remaining_time": "18:33:08", "throughput": 334.02, "total_tokens": 28364384} {"current_steps": 22395, "total_steps": 40000, "loss": 0.071, "lr": 0.12196223972463785, "epoch": 1.0942515818532725, "percentage": 55.99, "elapsed_time": "23:35:20", "remaining_time": "18:32:37", "throughput": 334.08, "total_tokens": 28370400} {"current_steps": 22400, "total_steps": 40000, "loss": 0.0603, "lr": 0.12190437519785885, "epoch": 1.0944958835169667, "percentage": 56.0, "elapsed_time": "23:35:23", "remaining_time": "18:32:05", "throughput": 334.14, "total_tokens": 28376640} {"current_steps": 22400, "total_steps": 40000, "eval_loss": 0.0651206523180008, "epoch": 1.0944958835169667, "percentage": 56.0, "elapsed_time": "23:46:04", "remaining_time": "18:40:28", "throughput": 331.64, "total_tokens": 28376640} {"current_steps": 22405, "total_steps": 40000, "loss": 0.0844, "lr": 0.12184651500377823, "epoch": 1.094740185180661, "percentage": 56.01, "elapsed_time": "23:46:07", "remaining_time": "18:39:57", "throughput": 331.7, "total_tokens": 28382816} {"current_steps": 22410, "total_steps": 40000, "loss": 0.0672, "lr": 0.12178865915131885, "epoch": 1.0949844868443555, "percentage": 56.03, "elapsed_time": "23:46:10", "remaining_time": "18:39:26", "throughput": 331.76, "total_tokens": 28389088} {"current_steps": 22415, "total_steps": 40000, "loss": 0.0546, "lr": 0.1217308076494027, "epoch": 1.0952287885080498, "percentage": 56.04, "elapsed_time": "23:46:13", "remaining_time": "18:38:54", "throughput": 331.82, "total_tokens": 28395264} {"current_steps": 22420, "total_steps": 40000, "loss": 0.0619, "lr": 0.12167296050695134, "epoch": 1.095473090171744, "percentage": 56.05, "elapsed_time": "23:46:16", "remaining_time": "18:38:22", "throughput": 331.88, "total_tokens": 28401408} {"current_steps": 22425, "total_steps": 40000, "loss": 0.0556, "lr": 0.12161511773288536, "epoch": 1.0957173918354384, "percentage": 56.06, "elapsed_time": "23:46:20", "remaining_time": "18:37:51", "throughput": 331.94, "total_tokens": 28407776} {"current_steps": 22430, "total_steps": 40000, "loss": 0.056, "lr": 0.121557279336125, "epoch": 1.0959616934991327, "percentage": 56.07, "elapsed_time": "23:46:23", "remaining_time": "18:37:19", "throughput": 332.0, "total_tokens": 28413600} {"current_steps": 22435, "total_steps": 40000, "loss": 0.0736, "lr": 0.12149944532558957, "epoch": 1.0962059951628271, "percentage": 56.09, "elapsed_time": "23:46:26", "remaining_time": "18:36:47", "throughput": 332.06, "total_tokens": 28419616} {"current_steps": 22440, "total_steps": 40000, "loss": 0.0534, "lr": 0.12144161571019785, "epoch": 1.0964502968265213, "percentage": 56.1, "elapsed_time": "23:46:29", "remaining_time": "18:36:16", "throughput": 332.12, "total_tokens": 28425632} {"current_steps": 22445, "total_steps": 40000, "loss": 0.0738, "lr": 0.12138379049886781, "epoch": 1.0966945984902157, "percentage": 56.11, "elapsed_time": "23:46:32", "remaining_time": "18:35:44", "throughput": 332.18, "total_tokens": 28432160} {"current_steps": 22450, "total_steps": 40000, "loss": 0.0607, "lr": 0.12132596970051697, "epoch": 1.09693890015391, "percentage": 56.12, "elapsed_time": "23:46:35", "remaining_time": "18:35:13", "throughput": 332.25, "total_tokens": 28438720} {"current_steps": 22455, "total_steps": 40000, "loss": 0.0607, "lr": 0.12126815332406189, "epoch": 1.0971832018176044, "percentage": 56.14, "elapsed_time": "23:46:38", "remaining_time": "18:34:41", "throughput": 332.31, "total_tokens": 28445184} {"current_steps": 22460, "total_steps": 40000, "loss": 0.0514, "lr": 0.12121034137841868, "epoch": 1.0974275034812988, "percentage": 56.15, "elapsed_time": "23:46:41", "remaining_time": "18:34:10", "throughput": 332.37, "total_tokens": 28451616} {"current_steps": 22465, "total_steps": 40000, "loss": 0.0503, "lr": 0.12115253387250258, "epoch": 1.097671805144993, "percentage": 56.16, "elapsed_time": "23:46:44", "remaining_time": "18:33:38", "throughput": 332.44, "total_tokens": 28458176} {"current_steps": 22470, "total_steps": 40000, "loss": 0.0701, "lr": 0.12109473081522831, "epoch": 1.0979161068086873, "percentage": 56.17, "elapsed_time": "23:46:47", "remaining_time": "18:33:07", "throughput": 332.5, "total_tokens": 28464832} {"current_steps": 22475, "total_steps": 40000, "loss": 0.0515, "lr": 0.12103693221550982, "epoch": 1.0981604084723817, "percentage": 56.19, "elapsed_time": "23:46:50", "remaining_time": "18:32:35", "throughput": 332.56, "total_tokens": 28471136} {"current_steps": 22480, "total_steps": 40000, "loss": 0.071, "lr": 0.12097913808226027, "epoch": 1.098404710136076, "percentage": 56.2, "elapsed_time": "23:46:54", "remaining_time": "18:32:04", "throughput": 332.63, "total_tokens": 28477792} {"current_steps": 22485, "total_steps": 40000, "loss": 0.049, "lr": 0.12092134842439234, "epoch": 1.0986490117997703, "percentage": 56.21, "elapsed_time": "23:46:57", "remaining_time": "18:31:32", "throughput": 332.69, "total_tokens": 28484000} {"current_steps": 22490, "total_steps": 40000, "loss": 0.0666, "lr": 0.12086356325081798, "epoch": 1.0988933134634646, "percentage": 56.23, "elapsed_time": "23:47:00", "remaining_time": "18:31:01", "throughput": 332.75, "total_tokens": 28490304} {"current_steps": 22495, "total_steps": 40000, "loss": 0.0347, "lr": 0.12080578257044824, "epoch": 1.099137615127159, "percentage": 56.24, "elapsed_time": "23:47:03", "remaining_time": "18:30:29", "throughput": 332.82, "total_tokens": 28497568} {"current_steps": 22500, "total_steps": 40000, "loss": 0.0465, "lr": 0.12074800639219378, "epoch": 1.0993819167908534, "percentage": 56.25, "elapsed_time": "23:47:06", "remaining_time": "18:29:58", "throughput": 332.89, "total_tokens": 28504640} {"current_steps": 22505, "total_steps": 40000, "loss": 0.0459, "lr": 0.12069023472496428, "epoch": 1.0996262184545478, "percentage": 56.26, "elapsed_time": "23:47:09", "remaining_time": "18:29:27", "throughput": 332.96, "total_tokens": 28511232} {"current_steps": 22510, "total_steps": 40000, "loss": 0.0436, "lr": 0.12063246757766893, "epoch": 1.099870520118242, "percentage": 56.27, "elapsed_time": "23:47:13", "remaining_time": "18:28:55", "throughput": 333.02, "total_tokens": 28517504} {"current_steps": 22515, "total_steps": 40000, "loss": 0.0786, "lr": 0.12057470495921618, "epoch": 1.1001148217819363, "percentage": 56.29, "elapsed_time": "23:47:16", "remaining_time": "18:28:24", "throughput": 333.08, "total_tokens": 28523296} {"current_steps": 22520, "total_steps": 40000, "loss": 0.0589, "lr": 0.12051694687851364, "epoch": 1.1003591234456307, "percentage": 56.3, "elapsed_time": "23:47:19", "remaining_time": "18:27:52", "throughput": 333.14, "total_tokens": 28529472} {"current_steps": 22525, "total_steps": 40000, "loss": 0.0567, "lr": 0.12045919334446839, "epoch": 1.100603425109325, "percentage": 56.31, "elapsed_time": "23:47:22", "remaining_time": "18:27:21", "throughput": 333.2, "total_tokens": 28535744} {"current_steps": 22530, "total_steps": 40000, "loss": 0.0537, "lr": 0.12040144436598683, "epoch": 1.1008477267730192, "percentage": 56.33, "elapsed_time": "23:47:25", "remaining_time": "18:26:50", "throughput": 333.26, "total_tokens": 28542368} {"current_steps": 22535, "total_steps": 40000, "loss": 0.0345, "lr": 0.12034369995197444, "epoch": 1.1010920284367136, "percentage": 56.34, "elapsed_time": "23:47:28", "remaining_time": "18:26:18", "throughput": 333.32, "total_tokens": 28548608} {"current_steps": 22540, "total_steps": 40000, "loss": 0.0732, "lr": 0.12028596011133627, "epoch": 1.101336330100408, "percentage": 56.35, "elapsed_time": "23:47:31", "remaining_time": "18:25:47", "throughput": 333.38, "total_tokens": 28554784} {"current_steps": 22545, "total_steps": 40000, "loss": 0.0413, "lr": 0.12022822485297643, "epoch": 1.1015806317641024, "percentage": 56.36, "elapsed_time": "23:47:34", "remaining_time": "18:25:16", "throughput": 333.44, "total_tokens": 28560928} {"current_steps": 22550, "total_steps": 40000, "loss": 0.0651, "lr": 0.12017049418579843, "epoch": 1.1018249334277965, "percentage": 56.38, "elapsed_time": "23:47:37", "remaining_time": "18:24:44", "throughput": 333.5, "total_tokens": 28566816} {"current_steps": 22555, "total_steps": 40000, "loss": 0.0396, "lr": 0.12011276811870514, "epoch": 1.102069235091491, "percentage": 56.39, "elapsed_time": "23:47:40", "remaining_time": "18:24:13", "throughput": 333.57, "total_tokens": 28573728} {"current_steps": 22560, "total_steps": 40000, "loss": 0.0526, "lr": 0.12005504666059852, "epoch": 1.1023135367551853, "percentage": 56.4, "elapsed_time": "23:47:43", "remaining_time": "18:23:42", "throughput": 333.63, "total_tokens": 28580288} {"current_steps": 22565, "total_steps": 40000, "loss": 0.0495, "lr": 0.11999732982038003, "epoch": 1.1025578384188797, "percentage": 56.41, "elapsed_time": "23:47:46", "remaining_time": "18:23:11", "throughput": 333.69, "total_tokens": 28586400} {"current_steps": 22570, "total_steps": 40000, "loss": 0.0353, "lr": 0.11993961760695038, "epoch": 1.102802140082574, "percentage": 56.43, "elapsed_time": "23:47:49", "remaining_time": "18:22:39", "throughput": 333.75, "total_tokens": 28592608} {"current_steps": 22575, "total_steps": 40000, "loss": 0.0543, "lr": 0.11988191002920942, "epoch": 1.1030464417462682, "percentage": 56.44, "elapsed_time": "23:47:52", "remaining_time": "18:22:08", "throughput": 333.81, "total_tokens": 28598464} {"current_steps": 22580, "total_steps": 40000, "loss": 0.0392, "lr": 0.11982420709605641, "epoch": 1.1032907434099626, "percentage": 56.45, "elapsed_time": "23:47:56", "remaining_time": "18:21:37", "throughput": 333.87, "total_tokens": 28604800} {"current_steps": 22585, "total_steps": 40000, "loss": 0.055, "lr": 0.11976650881638991, "epoch": 1.103535045073657, "percentage": 56.46, "elapsed_time": "23:47:59", "remaining_time": "18:21:06", "throughput": 333.93, "total_tokens": 28611040} {"current_steps": 22590, "total_steps": 40000, "loss": 0.0453, "lr": 0.11970881519910764, "epoch": 1.1037793467373513, "percentage": 56.47, "elapsed_time": "23:48:02", "remaining_time": "18:20:34", "throughput": 333.99, "total_tokens": 28616960} {"current_steps": 22595, "total_steps": 40000, "loss": 0.0732, "lr": 0.1196511262531068, "epoch": 1.1040236484010455, "percentage": 56.49, "elapsed_time": "23:48:05", "remaining_time": "18:20:03", "throughput": 334.05, "total_tokens": 28622976} {"current_steps": 22600, "total_steps": 40000, "loss": 0.0644, "lr": 0.11959344198728361, "epoch": 1.1042679500647399, "percentage": 56.5, "elapsed_time": "23:48:08", "remaining_time": "18:19:32", "throughput": 334.11, "total_tokens": 28629632} {"current_steps": 22600, "total_steps": 40000, "eval_loss": 0.06440416723489761, "epoch": 1.1042679500647399, "percentage": 56.5, "elapsed_time": "23:58:48", "remaining_time": "18:27:45", "throughput": 331.63, "total_tokens": 28629632} {"current_steps": 22605, "total_steps": 40000, "loss": 0.0272, "lr": 0.11953576241053378, "epoch": 1.1045122517284343, "percentage": 56.51, "elapsed_time": "23:58:52", "remaining_time": "18:27:14", "throughput": 331.7, "total_tokens": 28636320} {"current_steps": 22610, "total_steps": 40000, "loss": 0.0508, "lr": 0.11947808753175228, "epoch": 1.1047565533921286, "percentage": 56.53, "elapsed_time": "23:58:55", "remaining_time": "18:26:43", "throughput": 331.76, "total_tokens": 28643040} {"current_steps": 22615, "total_steps": 40000, "loss": 0.0498, "lr": 0.1194204173598332, "epoch": 1.105000855055823, "percentage": 56.54, "elapsed_time": "23:58:58", "remaining_time": "18:26:12", "throughput": 331.83, "total_tokens": 28649504} {"current_steps": 22620, "total_steps": 40000, "loss": 0.0431, "lr": 0.11936275190367007, "epoch": 1.1052451567195172, "percentage": 56.55, "elapsed_time": "23:59:02", "remaining_time": "18:25:40", "throughput": 331.89, "total_tokens": 28656064} {"current_steps": 22625, "total_steps": 40000, "loss": 0.0776, "lr": 0.11930509117215563, "epoch": 1.1054894583832116, "percentage": 56.56, "elapsed_time": "23:59:05", "remaining_time": "18:25:09", "throughput": 331.95, "total_tokens": 28662272} {"current_steps": 22630, "total_steps": 40000, "loss": 0.0808, "lr": 0.11924743517418179, "epoch": 1.105733760046906, "percentage": 56.57, "elapsed_time": "23:59:08", "remaining_time": "18:24:37", "throughput": 332.01, "total_tokens": 28668384} {"current_steps": 22635, "total_steps": 40000, "loss": 0.0356, "lr": 0.11918978391864, "epoch": 1.1059780617106003, "percentage": 56.59, "elapsed_time": "23:59:11", "remaining_time": "18:24:06", "throughput": 332.07, "total_tokens": 28674656} {"current_steps": 22640, "total_steps": 40000, "loss": 0.0628, "lr": 0.11913213741442065, "epoch": 1.1062223633742945, "percentage": 56.6, "elapsed_time": "23:59:14", "remaining_time": "18:23:35", "throughput": 332.13, "total_tokens": 28680608} {"current_steps": 22645, "total_steps": 40000, "loss": 0.0687, "lr": 0.11907449567041364, "epoch": 1.1064666650379889, "percentage": 56.61, "elapsed_time": "23:59:17", "remaining_time": "18:23:03", "throughput": 332.19, "total_tokens": 28686816} {"current_steps": 22650, "total_steps": 40000, "loss": 0.0475, "lr": 0.11901685869550803, "epoch": 1.1067109667016832, "percentage": 56.62, "elapsed_time": "23:59:20", "remaining_time": "18:22:32", "throughput": 332.25, "total_tokens": 28693408} {"current_steps": 22655, "total_steps": 40000, "loss": 0.0339, "lr": 0.1189592264985922, "epoch": 1.1069552683653776, "percentage": 56.64, "elapsed_time": "23:59:23", "remaining_time": "18:22:01", "throughput": 332.31, "total_tokens": 28699808} {"current_steps": 22660, "total_steps": 40000, "loss": 0.0809, "lr": 0.11890159908855373, "epoch": 1.107199570029072, "percentage": 56.65, "elapsed_time": "23:59:26", "remaining_time": "18:21:29", "throughput": 332.37, "total_tokens": 28706016} {"current_steps": 22665, "total_steps": 40000, "loss": 0.0671, "lr": 0.11884397647427941, "epoch": 1.1074438716927661, "percentage": 56.66, "elapsed_time": "23:59:29", "remaining_time": "18:20:58", "throughput": 332.43, "total_tokens": 28712224} {"current_steps": 22670, "total_steps": 40000, "loss": 0.0999, "lr": 0.11878635866465546, "epoch": 1.1076881733564605, "percentage": 56.67, "elapsed_time": "23:59:32", "remaining_time": "18:20:27", "throughput": 332.49, "total_tokens": 28718336} {"current_steps": 22675, "total_steps": 40000, "loss": 0.0499, "lr": 0.11872874566856734, "epoch": 1.107932475020155, "percentage": 56.69, "elapsed_time": "23:59:36", "remaining_time": "18:19:56", "throughput": 332.56, "total_tokens": 28725344} {"current_steps": 22680, "total_steps": 40000, "loss": 0.0718, "lr": 0.11867113749489955, "epoch": 1.1081767766838493, "percentage": 56.7, "elapsed_time": "23:59:39", "remaining_time": "18:19:24", "throughput": 332.62, "total_tokens": 28731264} {"current_steps": 22685, "total_steps": 40000, "loss": 0.0876, "lr": 0.11861353415253607, "epoch": 1.1084210783475434, "percentage": 56.71, "elapsed_time": "23:59:42", "remaining_time": "18:18:53", "throughput": 332.68, "total_tokens": 28737568} {"current_steps": 22690, "total_steps": 40000, "loss": 0.0568, "lr": 0.11855593565036011, "epoch": 1.1086653800112378, "percentage": 56.73, "elapsed_time": "23:59:45", "remaining_time": "18:18:22", "throughput": 332.74, "total_tokens": 28744064} {"current_steps": 22695, "total_steps": 40000, "loss": 0.0496, "lr": 0.11849834199725394, "epoch": 1.1089096816749322, "percentage": 56.74, "elapsed_time": "23:59:48", "remaining_time": "18:17:51", "throughput": 332.8, "total_tokens": 28749920} {"current_steps": 22700, "total_steps": 40000, "loss": 0.0702, "lr": 0.1184407532020994, "epoch": 1.1091539833386266, "percentage": 56.75, "elapsed_time": "23:59:51", "remaining_time": "18:17:19", "throughput": 332.85, "total_tokens": 28755584} {"current_steps": 22705, "total_steps": 40000, "loss": 0.053, "lr": 0.11838316927377723, "epoch": 1.109398285002321, "percentage": 56.76, "elapsed_time": "23:59:54", "remaining_time": "18:16:48", "throughput": 332.92, "total_tokens": 28762016} {"current_steps": 22710, "total_steps": 40000, "loss": 0.0791, "lr": 0.11832559022116766, "epoch": 1.1096425866660151, "percentage": 56.77, "elapsed_time": "23:59:57", "remaining_time": "18:16:17", "throughput": 332.98, "total_tokens": 28768416} {"current_steps": 22715, "total_steps": 40000, "loss": 0.0442, "lr": 0.11826801605315022, "epoch": 1.1098868883297095, "percentage": 56.79, "elapsed_time": "1 day, 0:00:00", "remaining_time": "18:15:46", "throughput": 333.04, "total_tokens": 28774432} {"current_steps": 22720, "total_steps": 40000, "loss": 0.0451, "lr": 0.1182104467786034, "epoch": 1.1101311899934039, "percentage": 56.8, "elapsed_time": "1 day, 0:00:03", "remaining_time": "18:15:15", "throughput": 333.1, "total_tokens": 28781312} {"current_steps": 22725, "total_steps": 40000, "loss": 0.0599, "lr": 0.1181528824064052, "epoch": 1.1103754916570983, "percentage": 56.81, "elapsed_time": "1 day, 0:00:06", "remaining_time": "18:14:44", "throughput": 333.16, "total_tokens": 28787616} {"current_steps": 22730, "total_steps": 40000, "loss": 0.0557, "lr": 0.11809532294543279, "epoch": 1.1106197933207924, "percentage": 56.83, "elapsed_time": "1 day, 0:00:09", "remaining_time": "18:14:13", "throughput": 333.23, "total_tokens": 28794016} {"current_steps": 22735, "total_steps": 40000, "loss": 0.0886, "lr": 0.11803776840456245, "epoch": 1.1108640949844868, "percentage": 56.84, "elapsed_time": "1 day, 0:00:12", "remaining_time": "18:13:42", "throughput": 333.29, "total_tokens": 28800704} {"current_steps": 22740, "total_steps": 40000, "loss": 0.0651, "lr": 0.11798021879266997, "epoch": 1.1111083966481812, "percentage": 56.85, "elapsed_time": "1 day, 0:00:16", "remaining_time": "18:13:11", "throughput": 333.35, "total_tokens": 28807104} {"current_steps": 22745, "total_steps": 40000, "loss": 0.0668, "lr": 0.11792267411863006, "epoch": 1.1113526983118756, "percentage": 56.86, "elapsed_time": "1 day, 0:00:19", "remaining_time": "18:12:39", "throughput": 333.41, "total_tokens": 28813408} {"current_steps": 22750, "total_steps": 40000, "loss": 0.0553, "lr": 0.1178651343913169, "epoch": 1.11159699997557, "percentage": 56.88, "elapsed_time": "1 day, 0:00:22", "remaining_time": "18:12:08", "throughput": 333.47, "total_tokens": 28819584} {"current_steps": 22755, "total_steps": 40000, "loss": 0.0562, "lr": 0.11780759961960392, "epoch": 1.111841301639264, "percentage": 56.89, "elapsed_time": "1 day, 0:00:25", "remaining_time": "18:11:37", "throughput": 333.54, "total_tokens": 28825984} {"current_steps": 22760, "total_steps": 40000, "loss": 0.1025, "lr": 0.1177500698123636, "epoch": 1.1120856033029585, "percentage": 56.9, "elapsed_time": "1 day, 0:00:28", "remaining_time": "18:11:06", "throughput": 333.6, "total_tokens": 28832800} {"current_steps": 22765, "total_steps": 40000, "loss": 0.0776, "lr": 0.11769254497846778, "epoch": 1.1123299049666528, "percentage": 56.91, "elapsed_time": "1 day, 0:00:31", "remaining_time": "18:10:35", "throughput": 333.66, "total_tokens": 28839072} {"current_steps": 22770, "total_steps": 40000, "loss": 0.0513, "lr": 0.11763502512678758, "epoch": 1.1125742066303472, "percentage": 56.93, "elapsed_time": "1 day, 0:00:34", "remaining_time": "18:10:04", "throughput": 333.73, "total_tokens": 28845472} {"current_steps": 22775, "total_steps": 40000, "loss": 0.0795, "lr": 0.11757751026619315, "epoch": 1.1128185082940414, "percentage": 56.94, "elapsed_time": "1 day, 0:00:37", "remaining_time": "18:09:33", "throughput": 333.79, "total_tokens": 28852288} {"current_steps": 22780, "total_steps": 40000, "loss": 0.0457, "lr": 0.11752000040555416, "epoch": 1.1130628099577358, "percentage": 56.95, "elapsed_time": "1 day, 0:00:40", "remaining_time": "18:09:02", "throughput": 333.86, "total_tokens": 28858976} {"current_steps": 22785, "total_steps": 40000, "loss": 0.0406, "lr": 0.11746249555373921, "epoch": 1.1133071116214301, "percentage": 56.96, "elapsed_time": "1 day, 0:00:44", "remaining_time": "18:08:31", "throughput": 333.92, "total_tokens": 28865280} {"current_steps": 22790, "total_steps": 40000, "loss": 0.0642, "lr": 0.11740499571961638, "epoch": 1.1135514132851245, "percentage": 56.97, "elapsed_time": "1 day, 0:00:47", "remaining_time": "18:08:01", "throughput": 333.98, "total_tokens": 28871680} {"current_steps": 22795, "total_steps": 40000, "loss": 0.0506, "lr": 0.11734750091205279, "epoch": 1.113795714948819, "percentage": 56.99, "elapsed_time": "1 day, 0:00:50", "remaining_time": "18:07:30", "throughput": 334.04, "total_tokens": 28877920} {"current_steps": 22800, "total_steps": 40000, "loss": 0.0821, "lr": 0.11729001113991493, "epoch": 1.114040016612513, "percentage": 57.0, "elapsed_time": "1 day, 0:00:53", "remaining_time": "18:06:59", "throughput": 334.1, "total_tokens": 28884480} {"current_steps": 22800, "total_steps": 40000, "eval_loss": 0.06433244794607162, "epoch": 1.114040016612513, "percentage": 57.0, "elapsed_time": "1 day, 0:11:33", "remaining_time": "18:15:02", "throughput": 331.65, "total_tokens": 28884480} {"current_steps": 22805, "total_steps": 40000, "loss": 0.0805, "lr": 0.11723252641206837, "epoch": 1.1142843182762074, "percentage": 57.01, "elapsed_time": "1 day, 0:11:37", "remaining_time": "18:14:31", "throughput": 331.7, "total_tokens": 28890560} {"current_steps": 22810, "total_steps": 40000, "loss": 0.0628, "lr": 0.11717504673737808, "epoch": 1.1145286199399018, "percentage": 57.03, "elapsed_time": "1 day, 0:11:40", "remaining_time": "18:14:00", "throughput": 331.76, "total_tokens": 28896640} {"current_steps": 22815, "total_steps": 40000, "loss": 0.0542, "lr": 0.11711757212470802, "epoch": 1.1147729216035962, "percentage": 57.04, "elapsed_time": "1 day, 0:11:43", "remaining_time": "18:13:29", "throughput": 331.83, "total_tokens": 28903232} {"current_steps": 22820, "total_steps": 40000, "loss": 0.0307, "lr": 0.11706010258292165, "epoch": 1.1150172232672904, "percentage": 57.05, "elapsed_time": "1 day, 0:11:46", "remaining_time": "18:12:58", "throughput": 331.89, "total_tokens": 28909888} {"current_steps": 22825, "total_steps": 40000, "loss": 0.0697, "lr": 0.11700263812088131, "epoch": 1.1152615249309847, "percentage": 57.06, "elapsed_time": "1 day, 0:11:50", "remaining_time": "18:12:27", "throughput": 331.95, "total_tokens": 28916608} {"current_steps": 22830, "total_steps": 40000, "loss": 0.0575, "lr": 0.11694517874744892, "epoch": 1.1155058265946791, "percentage": 57.07, "elapsed_time": "1 day, 0:11:53", "remaining_time": "18:11:56", "throughput": 332.02, "total_tokens": 28923104} {"current_steps": 22835, "total_steps": 40000, "loss": 0.0576, "lr": 0.11688772447148532, "epoch": 1.1157501282583735, "percentage": 57.09, "elapsed_time": "1 day, 0:11:56", "remaining_time": "18:11:25", "throughput": 332.07, "total_tokens": 28928960} {"current_steps": 22840, "total_steps": 40000, "loss": 0.0755, "lr": 0.11683027530185074, "epoch": 1.1159944299220679, "percentage": 57.1, "elapsed_time": "1 day, 0:11:59", "remaining_time": "18:10:53", "throughput": 332.13, "total_tokens": 28935040} {"current_steps": 22845, "total_steps": 40000, "loss": 0.0442, "lr": 0.11677283124740451, "epoch": 1.116238731585762, "percentage": 57.11, "elapsed_time": "1 day, 0:12:02", "remaining_time": "18:10:22", "throughput": 332.19, "total_tokens": 28941600} {"current_steps": 22850, "total_steps": 40000, "loss": 0.055, "lr": 0.11671539231700531, "epoch": 1.1164830332494564, "percentage": 57.12, "elapsed_time": "1 day, 0:12:05", "remaining_time": "18:09:51", "throughput": 332.26, "total_tokens": 28947968} {"current_steps": 22855, "total_steps": 40000, "loss": 0.0418, "lr": 0.11665795851951084, "epoch": 1.1167273349131508, "percentage": 57.14, "elapsed_time": "1 day, 0:12:08", "remaining_time": "18:09:20", "throughput": 332.33, "total_tokens": 28955104} {"current_steps": 22860, "total_steps": 40000, "loss": 0.0673, "lr": 0.11660052986377825, "epoch": 1.1169716365768452, "percentage": 57.15, "elapsed_time": "1 day, 0:12:11", "remaining_time": "18:08:49", "throughput": 332.38, "total_tokens": 28961152} {"current_steps": 22865, "total_steps": 40000, "loss": 0.0532, "lr": 0.1165431063586636, "epoch": 1.1172159382405393, "percentage": 57.16, "elapsed_time": "1 day, 0:12:14", "remaining_time": "18:08:18", "throughput": 332.44, "total_tokens": 28967328} {"current_steps": 22870, "total_steps": 40000, "loss": 0.0456, "lr": 0.11648568801302245, "epoch": 1.1174602399042337, "percentage": 57.17, "elapsed_time": "1 day, 0:12:17", "remaining_time": "18:07:47", "throughput": 332.51, "total_tokens": 28974208} {"current_steps": 22875, "total_steps": 40000, "loss": 0.0441, "lr": 0.11642827483570937, "epoch": 1.117704541567928, "percentage": 57.19, "elapsed_time": "1 day, 0:12:21", "remaining_time": "18:07:16", "throughput": 332.57, "total_tokens": 28980736} {"current_steps": 22880, "total_steps": 40000, "loss": 0.0578, "lr": 0.11637086683557815, "epoch": 1.1179488432316225, "percentage": 57.2, "elapsed_time": "1 day, 0:12:24", "remaining_time": "18:06:45", "throughput": 332.63, "total_tokens": 28986912} {"current_steps": 22885, "total_steps": 40000, "loss": 0.0615, "lr": 0.11631346402148188, "epoch": 1.1181931448953168, "percentage": 57.21, "elapsed_time": "1 day, 0:12:27", "remaining_time": "18:06:14", "throughput": 332.69, "total_tokens": 28993248} {"current_steps": 22890, "total_steps": 40000, "loss": 0.0703, "lr": 0.11625606640227285, "epoch": 1.118437446559011, "percentage": 57.23, "elapsed_time": "1 day, 0:12:30", "remaining_time": "18:05:43", "throughput": 332.76, "total_tokens": 29000192} {"current_steps": 22895, "total_steps": 40000, "loss": 0.0445, "lr": 0.11619867398680238, "epoch": 1.1186817482227054, "percentage": 57.24, "elapsed_time": "1 day, 0:12:33", "remaining_time": "18:05:13", "throughput": 332.83, "total_tokens": 29006944} {"current_steps": 22900, "total_steps": 40000, "loss": 0.0456, "lr": 0.11614128678392119, "epoch": 1.1189260498863998, "percentage": 57.25, "elapsed_time": "1 day, 0:12:36", "remaining_time": "18:04:42", "throughput": 332.88, "total_tokens": 29012640} {"current_steps": 22905, "total_steps": 40000, "loss": 0.0589, "lr": 0.11608390480247906, "epoch": 1.1191703515500941, "percentage": 57.26, "elapsed_time": "1 day, 0:12:39", "remaining_time": "18:04:11", "throughput": 332.94, "total_tokens": 29018688} {"current_steps": 22910, "total_steps": 40000, "loss": 0.096, "lr": 0.11602652805132499, "epoch": 1.1194146532137883, "percentage": 57.27, "elapsed_time": "1 day, 0:12:42", "remaining_time": "18:03:40", "throughput": 333.0, "total_tokens": 29025440} {"current_steps": 22915, "total_steps": 40000, "loss": 0.0599, "lr": 0.11596915653930731, "epoch": 1.1196589548774827, "percentage": 57.29, "elapsed_time": "1 day, 0:12:45", "remaining_time": "18:03:09", "throughput": 333.07, "total_tokens": 29032032} {"current_steps": 22920, "total_steps": 40000, "loss": 0.0572, "lr": 0.11591179027527328, "epoch": 1.119903256541177, "percentage": 57.3, "elapsed_time": "1 day, 0:12:49", "remaining_time": "18:02:38", "throughput": 333.13, "total_tokens": 29038528} {"current_steps": 22925, "total_steps": 40000, "loss": 0.049, "lr": 0.11585442926806956, "epoch": 1.1201475582048714, "percentage": 57.31, "elapsed_time": "1 day, 0:12:52", "remaining_time": "18:02:07", "throughput": 333.19, "total_tokens": 29045344} {"current_steps": 22930, "total_steps": 40000, "loss": 0.0715, "lr": 0.11579707352654202, "epoch": 1.1203918598685658, "percentage": 57.33, "elapsed_time": "1 day, 0:12:55", "remaining_time": "18:01:36", "throughput": 333.26, "total_tokens": 29051776} {"current_steps": 22935, "total_steps": 40000, "loss": 0.0802, "lr": 0.11573972305953548, "epoch": 1.12063616153226, "percentage": 57.34, "elapsed_time": "1 day, 0:12:58", "remaining_time": "18:01:05", "throughput": 333.31, "total_tokens": 29057824} {"current_steps": 22940, "total_steps": 40000, "loss": 0.0651, "lr": 0.11568237787589426, "epoch": 1.1208804631959544, "percentage": 57.35, "elapsed_time": "1 day, 0:13:01", "remaining_time": "18:00:35", "throughput": 333.38, "total_tokens": 29064480} {"current_steps": 22945, "total_steps": 40000, "loss": 0.0741, "lr": 0.11562503798446161, "epoch": 1.1211247648596487, "percentage": 57.36, "elapsed_time": "1 day, 0:13:04", "remaining_time": "18:00:04", "throughput": 333.44, "total_tokens": 29070688} {"current_steps": 22950, "total_steps": 40000, "loss": 0.0565, "lr": 0.11556770339408005, "epoch": 1.1213690665233431, "percentage": 57.38, "elapsed_time": "1 day, 0:13:07", "remaining_time": "17:59:33", "throughput": 333.5, "total_tokens": 29076960} {"current_steps": 22955, "total_steps": 40000, "loss": 0.0707, "lr": 0.1155103741135914, "epoch": 1.1216133681870373, "percentage": 57.39, "elapsed_time": "1 day, 0:13:10", "remaining_time": "17:59:02", "throughput": 333.55, "total_tokens": 29082976} {"current_steps": 22960, "total_steps": 40000, "loss": 0.0554, "lr": 0.1154530501518364, "epoch": 1.1218576698507317, "percentage": 57.4, "elapsed_time": "1 day, 0:13:14", "remaining_time": "17:58:32", "throughput": 333.62, "total_tokens": 29089568} {"current_steps": 22965, "total_steps": 40000, "loss": 0.0717, "lr": 0.11539573151765523, "epoch": 1.122101971514426, "percentage": 57.41, "elapsed_time": "1 day, 0:13:17", "remaining_time": "17:58:01", "throughput": 333.68, "total_tokens": 29096064} {"current_steps": 22970, "total_steps": 40000, "loss": 0.062, "lr": 0.11533841821988719, "epoch": 1.1223462731781204, "percentage": 57.43, "elapsed_time": "1 day, 0:13:20", "remaining_time": "17:57:30", "throughput": 333.74, "total_tokens": 29102144} {"current_steps": 22975, "total_steps": 40000, "loss": 0.0646, "lr": 0.11528111026737059, "epoch": 1.1225905748418146, "percentage": 57.44, "elapsed_time": "1 day, 0:13:23", "remaining_time": "17:56:59", "throughput": 333.8, "total_tokens": 29108352} {"current_steps": 22980, "total_steps": 40000, "loss": 0.0778, "lr": 0.11522380766894312, "epoch": 1.122834876505509, "percentage": 57.45, "elapsed_time": "1 day, 0:13:26", "remaining_time": "17:56:28", "throughput": 333.86, "total_tokens": 29114944} {"current_steps": 22985, "total_steps": 40000, "loss": 0.0888, "lr": 0.11516651043344152, "epoch": 1.1230791781692033, "percentage": 57.46, "elapsed_time": "1 day, 0:13:29", "remaining_time": "17:55:58", "throughput": 333.93, "total_tokens": 29121568} {"current_steps": 22990, "total_steps": 40000, "loss": 0.0752, "lr": 0.11510921856970172, "epoch": 1.1233234798328977, "percentage": 57.48, "elapsed_time": "1 day, 0:13:32", "remaining_time": "17:55:27", "throughput": 333.99, "total_tokens": 29127904} {"current_steps": 22995, "total_steps": 40000, "loss": 0.0805, "lr": 0.11505193208655895, "epoch": 1.123567781496592, "percentage": 57.49, "elapsed_time": "1 day, 0:13:35", "remaining_time": "17:54:56", "throughput": 334.05, "total_tokens": 29134336} {"current_steps": 23000, "total_steps": 40000, "loss": 0.0826, "lr": 0.11499465099284738, "epoch": 1.1238120831602862, "percentage": 57.5, "elapsed_time": "1 day, 0:13:39", "remaining_time": "17:54:26", "throughput": 334.11, "total_tokens": 29140832} {"current_steps": 23000, "total_steps": 40000, "eval_loss": 0.06436285376548767, "epoch": 1.1238120831602862, "percentage": 57.5, "elapsed_time": "1 day, 0:24:19", "remaining_time": "18:02:19", "throughput": 331.68, "total_tokens": 29140832} {"current_steps": 23005, "total_steps": 40000, "loss": 0.0461, "lr": 0.1149373752974006, "epoch": 1.1240563848239806, "percentage": 57.51, "elapsed_time": "1 day, 0:24:23", "remaining_time": "18:01:49", "throughput": 331.73, "total_tokens": 29147328} {"current_steps": 23010, "total_steps": 40000, "loss": 0.0847, "lr": 0.11488010500905109, "epoch": 1.124300686487675, "percentage": 57.53, "elapsed_time": "1 day, 0:24:26", "remaining_time": "18:01:18", "throughput": 331.79, "total_tokens": 29153472} {"current_steps": 23015, "total_steps": 40000, "loss": 0.0524, "lr": 0.11482284013663077, "epoch": 1.1245449881513694, "percentage": 57.54, "elapsed_time": "1 day, 0:24:29", "remaining_time": "18:00:47", "throughput": 331.85, "total_tokens": 29159776} {"current_steps": 23020, "total_steps": 40000, "loss": 0.0707, "lr": 0.11476558068897061, "epoch": 1.1247892898150635, "percentage": 57.55, "elapsed_time": "1 day, 0:24:32", "remaining_time": "18:00:16", "throughput": 331.91, "total_tokens": 29165952} {"current_steps": 23025, "total_steps": 40000, "loss": 0.0545, "lr": 0.11470832667490061, "epoch": 1.125033591478758, "percentage": 57.56, "elapsed_time": "1 day, 0:24:35", "remaining_time": "17:59:45", "throughput": 331.97, "total_tokens": 29172416} {"current_steps": 23030, "total_steps": 40000, "loss": 0.0472, "lr": 0.11465107810325013, "epoch": 1.1252778931424523, "percentage": 57.57, "elapsed_time": "1 day, 0:24:38", "remaining_time": "17:59:14", "throughput": 332.04, "total_tokens": 29179232} {"current_steps": 23035, "total_steps": 40000, "loss": 0.0532, "lr": 0.11459383498284771, "epoch": 1.1255221948061467, "percentage": 57.59, "elapsed_time": "1 day, 0:24:41", "remaining_time": "17:58:43", "throughput": 332.1, "total_tokens": 29185376} {"current_steps": 23040, "total_steps": 40000, "loss": 0.0491, "lr": 0.11453659732252082, "epoch": 1.1257664964698408, "percentage": 57.6, "elapsed_time": "1 day, 0:24:44", "remaining_time": "17:58:13", "throughput": 332.16, "total_tokens": 29191584} {"current_steps": 23045, "total_steps": 40000, "loss": 0.0545, "lr": 0.11447936513109633, "epoch": 1.1260107981335352, "percentage": 57.61, "elapsed_time": "1 day, 0:24:48", "remaining_time": "17:57:42", "throughput": 332.22, "total_tokens": 29198176} {"current_steps": 23050, "total_steps": 40000, "loss": 0.0404, "lr": 0.11442213841740011, "epoch": 1.1262550997972296, "percentage": 57.63, "elapsed_time": "1 day, 0:24:51", "remaining_time": "17:57:11", "throughput": 332.28, "total_tokens": 29204672} {"current_steps": 23055, "total_steps": 40000, "loss": 0.0477, "lr": 0.1143649171902572, "epoch": 1.126499401460924, "percentage": 57.64, "elapsed_time": "1 day, 0:24:54", "remaining_time": "17:56:40", "throughput": 332.34, "total_tokens": 29211040} {"current_steps": 23060, "total_steps": 40000, "loss": 0.0808, "lr": 0.11430770145849194, "epoch": 1.1267437031246184, "percentage": 57.65, "elapsed_time": "1 day, 0:24:57", "remaining_time": "17:56:09", "throughput": 332.41, "total_tokens": 29217920} {"current_steps": 23065, "total_steps": 40000, "loss": 0.0939, "lr": 0.11425049123092756, "epoch": 1.1269880047883125, "percentage": 57.66, "elapsed_time": "1 day, 0:25:00", "remaining_time": "17:55:39", "throughput": 332.47, "total_tokens": 29224352} {"current_steps": 23070, "total_steps": 40000, "loss": 0.073, "lr": 0.11419328651638674, "epoch": 1.127232306452007, "percentage": 57.67, "elapsed_time": "1 day, 0:25:03", "remaining_time": "17:55:08", "throughput": 332.52, "total_tokens": 29230016} {"current_steps": 23075, "total_steps": 40000, "loss": 0.04, "lr": 0.11413608732369115, "epoch": 1.1274766081157013, "percentage": 57.69, "elapsed_time": "1 day, 0:25:06", "remaining_time": "17:54:37", "throughput": 332.59, "total_tokens": 29237152} {"current_steps": 23080, "total_steps": 40000, "loss": 0.1017, "lr": 0.11407889366166153, "epoch": 1.1277209097793957, "percentage": 57.7, "elapsed_time": "1 day, 0:25:09", "remaining_time": "17:54:06", "throughput": 332.65, "total_tokens": 29243456} {"current_steps": 23085, "total_steps": 40000, "loss": 0.0464, "lr": 0.11402170553911797, "epoch": 1.1279652114430898, "percentage": 57.71, "elapsed_time": "1 day, 0:25:12", "remaining_time": "17:53:36", "throughput": 332.71, "total_tokens": 29249824} {"current_steps": 23090, "total_steps": 40000, "loss": 0.0448, "lr": 0.11396452296487955, "epoch": 1.1282095131067842, "percentage": 57.73, "elapsed_time": "1 day, 0:25:16", "remaining_time": "17:53:05", "throughput": 332.78, "total_tokens": 29256544} {"current_steps": 23095, "total_steps": 40000, "loss": 0.0571, "lr": 0.11390734594776449, "epoch": 1.1284538147704786, "percentage": 57.74, "elapsed_time": "1 day, 0:25:19", "remaining_time": "17:52:34", "throughput": 332.84, "total_tokens": 29263008} {"current_steps": 23100, "total_steps": 40000, "loss": 0.056, "lr": 0.11385017449659031, "epoch": 1.128698116434173, "percentage": 57.75, "elapsed_time": "1 day, 0:25:22", "remaining_time": "17:52:04", "throughput": 332.9, "total_tokens": 29269280} {"current_steps": 23105, "total_steps": 40000, "loss": 0.0469, "lr": 0.11379300862017344, "epoch": 1.1289424180978673, "percentage": 57.76, "elapsed_time": "1 day, 0:25:25", "remaining_time": "17:51:33", "throughput": 332.96, "total_tokens": 29275552} {"current_steps": 23110, "total_steps": 40000, "loss": 0.0825, "lr": 0.11373584832732966, "epoch": 1.1291867197615615, "percentage": 57.77, "elapsed_time": "1 day, 0:25:28", "remaining_time": "17:51:02", "throughput": 333.02, "total_tokens": 29281632} {"current_steps": 23115, "total_steps": 40000, "loss": 0.0769, "lr": 0.11367869362687386, "epoch": 1.1294310214252559, "percentage": 57.79, "elapsed_time": "1 day, 0:25:31", "remaining_time": "17:50:32", "throughput": 333.08, "total_tokens": 29287936} {"current_steps": 23120, "total_steps": 40000, "loss": 0.0616, "lr": 0.11362154452761988, "epoch": 1.1296753230889502, "percentage": 57.8, "elapsed_time": "1 day, 0:25:34", "remaining_time": "17:50:01", "throughput": 333.13, "total_tokens": 29293792} {"current_steps": 23125, "total_steps": 40000, "loss": 0.0637, "lr": 0.11356440103838095, "epoch": 1.1299196247526446, "percentage": 57.81, "elapsed_time": "1 day, 0:25:37", "remaining_time": "17:49:30", "throughput": 333.19, "total_tokens": 29300160} {"current_steps": 23130, "total_steps": 40000, "loss": 0.0817, "lr": 0.11350726316796922, "epoch": 1.1301639264163388, "percentage": 57.83, "elapsed_time": "1 day, 0:25:40", "remaining_time": "17:49:00", "throughput": 333.25, "total_tokens": 29306528} {"current_steps": 23135, "total_steps": 40000, "loss": 0.0764, "lr": 0.11345013092519607, "epoch": 1.1304082280800332, "percentage": 57.84, "elapsed_time": "1 day, 0:25:43", "remaining_time": "17:48:29", "throughput": 333.31, "total_tokens": 29312960} {"current_steps": 23140, "total_steps": 40000, "loss": 0.0534, "lr": 0.11339300431887213, "epoch": 1.1306525297437275, "percentage": 57.85, "elapsed_time": "1 day, 0:25:46", "remaining_time": "17:47:58", "throughput": 333.38, "total_tokens": 29319424} {"current_steps": 23145, "total_steps": 40000, "loss": 0.0432, "lr": 0.11333588335780687, "epoch": 1.130896831407422, "percentage": 57.86, "elapsed_time": "1 day, 0:25:50", "remaining_time": "17:47:28", "throughput": 333.44, "total_tokens": 29325696} {"current_steps": 23150, "total_steps": 40000, "loss": 0.0554, "lr": 0.11327876805080916, "epoch": 1.1311411330711163, "percentage": 57.88, "elapsed_time": "1 day, 0:25:53", "remaining_time": "17:46:57", "throughput": 333.49, "total_tokens": 29331808} {"current_steps": 23155, "total_steps": 40000, "loss": 0.0543, "lr": 0.11322165840668696, "epoch": 1.1313854347348105, "percentage": 57.89, "elapsed_time": "1 day, 0:25:56", "remaining_time": "17:46:27", "throughput": 333.56, "total_tokens": 29338304} {"current_steps": 23160, "total_steps": 40000, "loss": 0.0238, "lr": 0.11316455443424717, "epoch": 1.1316297363985048, "percentage": 57.9, "elapsed_time": "1 day, 0:25:59", "remaining_time": "17:45:56", "throughput": 333.61, "total_tokens": 29344256} {"current_steps": 23165, "total_steps": 40000, "loss": 0.0515, "lr": 0.11310745614229603, "epoch": 1.1318740380621992, "percentage": 57.91, "elapsed_time": "1 day, 0:26:02", "remaining_time": "17:45:26", "throughput": 333.67, "total_tokens": 29350720} {"current_steps": 23170, "total_steps": 40000, "loss": 0.0708, "lr": 0.1130503635396387, "epoch": 1.1321183397258936, "percentage": 57.93, "elapsed_time": "1 day, 0:26:05", "remaining_time": "17:44:55", "throughput": 333.73, "total_tokens": 29357024} {"current_steps": 23175, "total_steps": 40000, "loss": 0.0311, "lr": 0.11299327663507966, "epoch": 1.1323626413895878, "percentage": 57.94, "elapsed_time": "1 day, 0:26:08", "remaining_time": "17:44:25", "throughput": 333.8, "total_tokens": 29364224} {"current_steps": 23180, "total_steps": 40000, "loss": 0.0568, "lr": 0.11293619543742246, "epoch": 1.1326069430532821, "percentage": 57.95, "elapsed_time": "1 day, 0:26:11", "remaining_time": "17:43:54", "throughput": 333.87, "total_tokens": 29371168} {"current_steps": 23185, "total_steps": 40000, "loss": 0.0399, "lr": 0.11287911995546965, "epoch": 1.1328512447169765, "percentage": 57.96, "elapsed_time": "1 day, 0:26:15", "remaining_time": "17:43:24", "throughput": 333.93, "total_tokens": 29377408} {"current_steps": 23190, "total_steps": 40000, "loss": 0.0396, "lr": 0.11282205019802308, "epoch": 1.133095546380671, "percentage": 57.98, "elapsed_time": "1 day, 0:26:18", "remaining_time": "17:42:53", "throughput": 333.99, "total_tokens": 29383936} {"current_steps": 23195, "total_steps": 40000, "loss": 0.0845, "lr": 0.11276498617388354, "epoch": 1.1333398480443653, "percentage": 57.99, "elapsed_time": "1 day, 0:26:21", "remaining_time": "17:42:23", "throughput": 334.06, "total_tokens": 29390912} {"current_steps": 23200, "total_steps": 40000, "loss": 0.0514, "lr": 0.11270792789185109, "epoch": 1.1335841497080594, "percentage": 58.0, "elapsed_time": "1 day, 0:26:24", "remaining_time": "17:41:52", "throughput": 334.12, "total_tokens": 29396960} {"current_steps": 23200, "total_steps": 40000, "eval_loss": 0.06410333514213562, "epoch": 1.1335841497080594, "percentage": 58.0, "elapsed_time": "1 day, 0:37:04", "remaining_time": "17:49:36", "throughput": 331.7, "total_tokens": 29396960} {"current_steps": 23205, "total_steps": 40000, "loss": 0.0526, "lr": 0.11265087536072482, "epoch": 1.1338284513717538, "percentage": 58.01, "elapsed_time": "1 day, 0:37:10", "remaining_time": "17:49:07", "throughput": 331.76, "total_tokens": 29403552} {"current_steps": 23210, "total_steps": 40000, "loss": 0.0744, "lr": 0.11259382858930288, "epoch": 1.1340727530354482, "percentage": 58.03, "elapsed_time": "1 day, 0:37:13", "remaining_time": "17:48:36", "throughput": 331.81, "total_tokens": 29409792} {"current_steps": 23215, "total_steps": 40000, "loss": 0.0514, "lr": 0.11253678758638262, "epoch": 1.1343170546991426, "percentage": 58.04, "elapsed_time": "1 day, 0:37:16", "remaining_time": "17:48:06", "throughput": 331.87, "total_tokens": 29415872} {"current_steps": 23220, "total_steps": 40000, "loss": 0.072, "lr": 0.11247975236076059, "epoch": 1.1345613563628367, "percentage": 58.05, "elapsed_time": "1 day, 0:37:19", "remaining_time": "17:47:35", "throughput": 331.93, "total_tokens": 29422496} {"current_steps": 23225, "total_steps": 40000, "loss": 0.0425, "lr": 0.11242272292123218, "epoch": 1.134805658026531, "percentage": 58.06, "elapsed_time": "1 day, 0:37:22", "remaining_time": "17:47:04", "throughput": 331.99, "total_tokens": 29428512} {"current_steps": 23230, "total_steps": 40000, "loss": 0.0385, "lr": 0.11236569927659217, "epoch": 1.1350499596902255, "percentage": 58.07, "elapsed_time": "1 day, 0:37:25", "remaining_time": "17:46:34", "throughput": 332.04, "total_tokens": 29434272} {"current_steps": 23235, "total_steps": 40000, "loss": 0.0435, "lr": 0.11230868143563429, "epoch": 1.1352942613539199, "percentage": 58.09, "elapsed_time": "1 day, 0:37:28", "remaining_time": "17:46:03", "throughput": 332.1, "total_tokens": 29440640} {"current_steps": 23240, "total_steps": 40000, "loss": 0.0669, "lr": 0.11225166940715131, "epoch": 1.1355385630176142, "percentage": 58.1, "elapsed_time": "1 day, 0:37:31", "remaining_time": "17:45:33", "throughput": 332.17, "total_tokens": 29447168} {"current_steps": 23245, "total_steps": 40000, "loss": 0.066, "lr": 0.11219466319993537, "epoch": 1.1357828646813084, "percentage": 58.11, "elapsed_time": "1 day, 0:37:34", "remaining_time": "17:45:02", "throughput": 332.22, "total_tokens": 29453312} {"current_steps": 23250, "total_steps": 40000, "loss": 0.0628, "lr": 0.11213766282277739, "epoch": 1.1360271663450028, "percentage": 58.13, "elapsed_time": "1 day, 0:37:37", "remaining_time": "17:44:31", "throughput": 332.28, "total_tokens": 29459552} {"current_steps": 23255, "total_steps": 40000, "loss": 0.0502, "lr": 0.11208066828446761, "epoch": 1.1362714680086972, "percentage": 58.14, "elapsed_time": "1 day, 0:37:41", "remaining_time": "17:44:01", "throughput": 332.35, "total_tokens": 29466464} {"current_steps": 23260, "total_steps": 40000, "loss": 0.0463, "lr": 0.11202367959379537, "epoch": 1.1365157696723915, "percentage": 58.15, "elapsed_time": "1 day, 0:37:44", "remaining_time": "17:43:30", "throughput": 332.41, "total_tokens": 29472800} {"current_steps": 23265, "total_steps": 40000, "loss": 0.0484, "lr": 0.11196669675954894, "epoch": 1.1367600713360857, "percentage": 58.16, "elapsed_time": "1 day, 0:37:47", "remaining_time": "17:43:00", "throughput": 332.47, "total_tokens": 29479136} {"current_steps": 23270, "total_steps": 40000, "loss": 0.0562, "lr": 0.1119097197905158, "epoch": 1.13700437299978, "percentage": 58.17, "elapsed_time": "1 day, 0:37:50", "remaining_time": "17:42:29", "throughput": 332.53, "total_tokens": 29485248} {"current_steps": 23275, "total_steps": 40000, "loss": 0.0409, "lr": 0.11185274869548259, "epoch": 1.1372486746634745, "percentage": 58.19, "elapsed_time": "1 day, 0:37:53", "remaining_time": "17:41:59", "throughput": 332.58, "total_tokens": 29491296} {"current_steps": 23280, "total_steps": 40000, "loss": 0.0717, "lr": 0.11179578348323486, "epoch": 1.1374929763271688, "percentage": 58.2, "elapsed_time": "1 day, 0:37:56", "remaining_time": "17:41:28", "throughput": 332.64, "total_tokens": 29497440} {"current_steps": 23285, "total_steps": 40000, "loss": 0.0613, "lr": 0.1117388241625575, "epoch": 1.1377372779908632, "percentage": 58.21, "elapsed_time": "1 day, 0:37:59", "remaining_time": "17:40:58", "throughput": 332.7, "total_tokens": 29503488} {"current_steps": 23290, "total_steps": 40000, "loss": 0.0555, "lr": 0.11168187074223421, "epoch": 1.1379815796545574, "percentage": 58.23, "elapsed_time": "1 day, 0:38:02", "remaining_time": "17:40:27", "throughput": 332.76, "total_tokens": 29509952} {"current_steps": 23295, "total_steps": 40000, "loss": 0.0759, "lr": 0.11162492323104796, "epoch": 1.1382258813182518, "percentage": 58.24, "elapsed_time": "1 day, 0:38:05", "remaining_time": "17:39:57", "throughput": 332.81, "total_tokens": 29515744} {"current_steps": 23300, "total_steps": 40000, "loss": 0.0469, "lr": 0.11156798163778091, "epoch": 1.1384701829819461, "percentage": 58.25, "elapsed_time": "1 day, 0:38:08", "remaining_time": "17:39:26", "throughput": 332.87, "total_tokens": 29521632} {"current_steps": 23305, "total_steps": 40000, "loss": 0.0351, "lr": 0.11151104597121399, "epoch": 1.1387144846456405, "percentage": 58.26, "elapsed_time": "1 day, 0:38:11", "remaining_time": "17:38:56", "throughput": 332.93, "total_tokens": 29528352} {"current_steps": 23310, "total_steps": 40000, "loss": 0.0629, "lr": 0.11145411624012742, "epoch": 1.1389587863093347, "percentage": 58.27, "elapsed_time": "1 day, 0:38:14", "remaining_time": "17:38:25", "throughput": 332.99, "total_tokens": 29534720} {"current_steps": 23315, "total_steps": 40000, "loss": 0.0661, "lr": 0.11139719245330063, "epoch": 1.139203087973029, "percentage": 58.29, "elapsed_time": "1 day, 0:38:17", "remaining_time": "17:37:55", "throughput": 333.05, "total_tokens": 29540896} {"current_steps": 23320, "total_steps": 40000, "loss": 0.0861, "lr": 0.11134027461951179, "epoch": 1.1394473896367234, "percentage": 58.3, "elapsed_time": "1 day, 0:38:21", "remaining_time": "17:37:24", "throughput": 333.11, "total_tokens": 29547200} {"current_steps": 23325, "total_steps": 40000, "loss": 0.0317, "lr": 0.11128336274753849, "epoch": 1.1396916913004178, "percentage": 58.31, "elapsed_time": "1 day, 0:38:24", "remaining_time": "17:36:54", "throughput": 333.17, "total_tokens": 29553504} {"current_steps": 23330, "total_steps": 40000, "loss": 0.0622, "lr": 0.11122645684615715, "epoch": 1.1399359929641122, "percentage": 58.33, "elapsed_time": "1 day, 0:38:27", "remaining_time": "17:36:24", "throughput": 333.23, "total_tokens": 29559936} {"current_steps": 23335, "total_steps": 40000, "loss": 0.0482, "lr": 0.11116955692414345, "epoch": 1.1401802946278063, "percentage": 58.34, "elapsed_time": "1 day, 0:38:30", "remaining_time": "17:35:53", "throughput": 333.29, "total_tokens": 29566496} {"current_steps": 23340, "total_steps": 40000, "loss": 0.0703, "lr": 0.11111266299027203, "epoch": 1.1404245962915007, "percentage": 58.35, "elapsed_time": "1 day, 0:38:33", "remaining_time": "17:35:23", "throughput": 333.35, "total_tokens": 29572512} {"current_steps": 23345, "total_steps": 40000, "loss": 0.0544, "lr": 0.11105577505331668, "epoch": 1.140668897955195, "percentage": 58.36, "elapsed_time": "1 day, 0:38:36", "remaining_time": "17:34:52", "throughput": 333.41, "total_tokens": 29578496} {"current_steps": 23350, "total_steps": 40000, "loss": 0.0548, "lr": 0.11099889312205018, "epoch": 1.1409131996188895, "percentage": 58.38, "elapsed_time": "1 day, 0:38:39", "remaining_time": "17:34:22", "throughput": 333.47, "total_tokens": 29584928} {"current_steps": 23355, "total_steps": 40000, "loss": 0.0565, "lr": 0.11094201720524455, "epoch": 1.1411575012825836, "percentage": 58.39, "elapsed_time": "1 day, 0:38:42", "remaining_time": "17:33:52", "throughput": 333.52, "total_tokens": 29591072} {"current_steps": 23360, "total_steps": 40000, "loss": 0.0368, "lr": 0.11088514731167064, "epoch": 1.141401802946278, "percentage": 58.4, "elapsed_time": "1 day, 0:38:45", "remaining_time": "17:33:21", "throughput": 333.58, "total_tokens": 29596864} {"current_steps": 23365, "total_steps": 40000, "loss": 0.0361, "lr": 0.11082828345009862, "epoch": 1.1416461046099724, "percentage": 58.41, "elapsed_time": "1 day, 0:38:48", "remaining_time": "17:32:51", "throughput": 333.64, "total_tokens": 29603776} {"current_steps": 23370, "total_steps": 40000, "loss": 0.0774, "lr": 0.11077142562929748, "epoch": 1.1418904062736668, "percentage": 58.43, "elapsed_time": "1 day, 0:38:51", "remaining_time": "17:32:21", "throughput": 333.7, "total_tokens": 29609888} {"current_steps": 23375, "total_steps": 40000, "loss": 0.0892, "lr": 0.11071457385803554, "epoch": 1.1421347079373612, "percentage": 58.44, "elapsed_time": "1 day, 0:38:54", "remaining_time": "17:31:50", "throughput": 333.76, "total_tokens": 29616192} {"current_steps": 23380, "total_steps": 40000, "loss": 0.0804, "lr": 0.11065772814508001, "epoch": 1.1423790096010553, "percentage": 58.45, "elapsed_time": "1 day, 0:38:58", "remaining_time": "17:31:20", "throughput": 333.82, "total_tokens": 29622560} {"current_steps": 23385, "total_steps": 40000, "loss": 0.0631, "lr": 0.11060088849919715, "epoch": 1.1426233112647497, "percentage": 58.46, "elapsed_time": "1 day, 0:39:01", "remaining_time": "17:30:50", "throughput": 333.88, "total_tokens": 29628448} {"current_steps": 23390, "total_steps": 40000, "loss": 0.0364, "lr": 0.11054405492915244, "epoch": 1.142867612928444, "percentage": 58.48, "elapsed_time": "1 day, 0:39:04", "remaining_time": "17:30:20", "throughput": 333.94, "total_tokens": 29635168} {"current_steps": 23395, "total_steps": 40000, "loss": 0.067, "lr": 0.11048722744371031, "epoch": 1.1431119145921385, "percentage": 58.49, "elapsed_time": "1 day, 0:39:07", "remaining_time": "17:29:49", "throughput": 334.0, "total_tokens": 29641504} {"current_steps": 23400, "total_steps": 40000, "loss": 0.0517, "lr": 0.1104304060516342, "epoch": 1.1433562162558326, "percentage": 58.5, "elapsed_time": "1 day, 0:39:10", "remaining_time": "17:29:19", "throughput": 334.06, "total_tokens": 29648032} {"current_steps": 23400, "total_steps": 40000, "eval_loss": 0.0638449415564537, "epoch": 1.1433562162558326, "percentage": 58.5, "elapsed_time": "1 day, 0:49:51", "remaining_time": "17:36:54", "throughput": 331.67, "total_tokens": 29648032} {"current_steps": 23405, "total_steps": 40000, "loss": 0.0446, "lr": 0.11037359076168682, "epoch": 1.143600517919527, "percentage": 58.51, "elapsed_time": "1 day, 0:49:54", "remaining_time": "17:36:24", "throughput": 331.72, "total_tokens": 29654368} {"current_steps": 23410, "total_steps": 40000, "loss": 0.0498, "lr": 0.11031678158262966, "epoch": 1.1438448195832214, "percentage": 58.53, "elapsed_time": "1 day, 0:49:57", "remaining_time": "17:35:53", "throughput": 331.78, "total_tokens": 29660576} {"current_steps": 23415, "total_steps": 40000, "loss": 0.05, "lr": 0.11025997852322349, "epoch": 1.1440891212469158, "percentage": 58.54, "elapsed_time": "1 day, 0:50:01", "remaining_time": "17:35:23", "throughput": 331.84, "total_tokens": 29667136} {"current_steps": 23420, "total_steps": 40000, "loss": 0.0885, "lr": 0.11020318159222807, "epoch": 1.1443334229106101, "percentage": 58.55, "elapsed_time": "1 day, 0:50:04", "remaining_time": "17:34:52", "throughput": 331.9, "total_tokens": 29673376} {"current_steps": 23425, "total_steps": 40000, "loss": 0.0597, "lr": 0.1101463907984021, "epoch": 1.1445777245743043, "percentage": 58.56, "elapsed_time": "1 day, 0:50:07", "remaining_time": "17:34:22", "throughput": 331.96, "total_tokens": 29679488} {"current_steps": 23430, "total_steps": 40000, "loss": 0.0625, "lr": 0.11008960615050352, "epoch": 1.1448220262379987, "percentage": 58.58, "elapsed_time": "1 day, 0:50:10", "remaining_time": "17:33:52", "throughput": 332.01, "total_tokens": 29684992} {"current_steps": 23435, "total_steps": 40000, "loss": 0.0866, "lr": 0.11003282765728925, "epoch": 1.145066327901693, "percentage": 58.59, "elapsed_time": "1 day, 0:50:13", "remaining_time": "17:33:21", "throughput": 332.07, "total_tokens": 29691072} {"current_steps": 23440, "total_steps": 40000, "loss": 0.0541, "lr": 0.10997605532751518, "epoch": 1.1453106295653874, "percentage": 58.6, "elapsed_time": "1 day, 0:50:16", "remaining_time": "17:32:51", "throughput": 332.12, "total_tokens": 29697312} {"current_steps": 23445, "total_steps": 40000, "loss": 0.0697, "lr": 0.1099192891699364, "epoch": 1.1455549312290816, "percentage": 58.61, "elapsed_time": "1 day, 0:50:19", "remaining_time": "17:32:20", "throughput": 332.18, "total_tokens": 29703808} {"current_steps": 23450, "total_steps": 40000, "loss": 0.071, "lr": 0.10986252919330687, "epoch": 1.145799232892776, "percentage": 58.63, "elapsed_time": "1 day, 0:50:22", "remaining_time": "17:31:50", "throughput": 332.24, "total_tokens": 29709888} {"current_steps": 23455, "total_steps": 40000, "loss": 0.0765, "lr": 0.10980577540637973, "epoch": 1.1460435345564703, "percentage": 58.64, "elapsed_time": "1 day, 0:50:25", "remaining_time": "17:31:20", "throughput": 332.3, "total_tokens": 29716032} {"current_steps": 23460, "total_steps": 40000, "loss": 0.0526, "lr": 0.10974902781790719, "epoch": 1.1462878362201647, "percentage": 58.65, "elapsed_time": "1 day, 0:50:28", "remaining_time": "17:30:49", "throughput": 332.36, "total_tokens": 29722720} {"current_steps": 23465, "total_steps": 40000, "loss": 0.0748, "lr": 0.10969228643664032, "epoch": 1.146532137883859, "percentage": 58.66, "elapsed_time": "1 day, 0:50:31", "remaining_time": "17:30:19", "throughput": 332.42, "total_tokens": 29728928} {"current_steps": 23470, "total_steps": 40000, "loss": 0.0876, "lr": 0.10963555127132942, "epoch": 1.1467764395475533, "percentage": 58.67, "elapsed_time": "1 day, 0:50:34", "remaining_time": "17:29:49", "throughput": 332.48, "total_tokens": 29735168} {"current_steps": 23475, "total_steps": 40000, "loss": 0.057, "lr": 0.10957882233072382, "epoch": 1.1470207412112476, "percentage": 58.69, "elapsed_time": "1 day, 0:50:37", "remaining_time": "17:29:18", "throughput": 332.53, "total_tokens": 29741088} {"current_steps": 23480, "total_steps": 40000, "loss": 0.0365, "lr": 0.10952209962357176, "epoch": 1.147265042874942, "percentage": 58.7, "elapsed_time": "1 day, 0:50:40", "remaining_time": "17:28:48", "throughput": 332.59, "total_tokens": 29747328} {"current_steps": 23485, "total_steps": 40000, "loss": 0.0497, "lr": 0.10946538315862062, "epoch": 1.1475093445386364, "percentage": 58.71, "elapsed_time": "1 day, 0:50:43", "remaining_time": "17:28:18", "throughput": 332.65, "total_tokens": 29753792} {"current_steps": 23490, "total_steps": 40000, "loss": 0.08, "lr": 0.10940867294461679, "epoch": 1.1477536462023306, "percentage": 58.73, "elapsed_time": "1 day, 0:50:47", "remaining_time": "17:27:48", "throughput": 332.71, "total_tokens": 29760288} {"current_steps": 23495, "total_steps": 40000, "loss": 0.0947, "lr": 0.10935196899030565, "epoch": 1.147997947866025, "percentage": 58.74, "elapsed_time": "1 day, 0:50:50", "remaining_time": "17:27:17", "throughput": 332.77, "total_tokens": 29766144} {"current_steps": 23500, "total_steps": 40000, "loss": 0.0545, "lr": 0.10929527130443177, "epoch": 1.1482422495297193, "percentage": 58.75, "elapsed_time": "1 day, 0:50:53", "remaining_time": "17:26:47", "throughput": 332.83, "total_tokens": 29772800} {"current_steps": 23505, "total_steps": 40000, "loss": 0.0746, "lr": 0.1092385798957385, "epoch": 1.1484865511934137, "percentage": 58.76, "elapsed_time": "1 day, 0:50:56", "remaining_time": "17:26:17", "throughput": 332.89, "total_tokens": 29778752} {"current_steps": 23510, "total_steps": 40000, "loss": 0.0453, "lr": 0.10918189477296848, "epoch": 1.148730852857108, "percentage": 58.77, "elapsed_time": "1 day, 0:50:59", "remaining_time": "17:25:47", "throughput": 332.94, "total_tokens": 29784960} {"current_steps": 23515, "total_steps": 40000, "loss": 0.0606, "lr": 0.1091252159448633, "epoch": 1.1489751545208022, "percentage": 58.79, "elapsed_time": "1 day, 0:51:02", "remaining_time": "17:25:16", "throughput": 333.0, "total_tokens": 29791296} {"current_steps": 23520, "total_steps": 40000, "loss": 0.0848, "lr": 0.10906854342016345, "epoch": 1.1492194561844966, "percentage": 58.8, "elapsed_time": "1 day, 0:51:05", "remaining_time": "17:24:46", "throughput": 333.06, "total_tokens": 29797376} {"current_steps": 23525, "total_steps": 40000, "loss": 0.0663, "lr": 0.10901187720760858, "epoch": 1.149463757848191, "percentage": 58.81, "elapsed_time": "1 day, 0:51:08", "remaining_time": "17:24:16", "throughput": 333.12, "total_tokens": 29803328} {"current_steps": 23530, "total_steps": 40000, "loss": 0.075, "lr": 0.10895521731593734, "epoch": 1.1497080595118854, "percentage": 58.83, "elapsed_time": "1 day, 0:51:11", "remaining_time": "17:23:46", "throughput": 333.17, "total_tokens": 29809408} {"current_steps": 23535, "total_steps": 40000, "loss": 0.0846, "lr": 0.10889856375388733, "epoch": 1.1499523611755795, "percentage": 58.84, "elapsed_time": "1 day, 0:51:14", "remaining_time": "17:23:16", "throughput": 333.23, "total_tokens": 29815360} {"current_steps": 23540, "total_steps": 40000, "loss": 0.062, "lr": 0.1088419165301954, "epoch": 1.150196662839274, "percentage": 58.85, "elapsed_time": "1 day, 0:51:17", "remaining_time": "17:22:45", "throughput": 333.29, "total_tokens": 29821696} {"current_steps": 23545, "total_steps": 40000, "loss": 0.0505, "lr": 0.1087852756535971, "epoch": 1.1504409645029683, "percentage": 58.86, "elapsed_time": "1 day, 0:51:20", "remaining_time": "17:22:15", "throughput": 333.34, "total_tokens": 29827808} {"current_steps": 23550, "total_steps": 40000, "loss": 0.0783, "lr": 0.10872864113282725, "epoch": 1.1506852661666627, "percentage": 58.88, "elapsed_time": "1 day, 0:51:23", "remaining_time": "17:21:45", "throughput": 333.4, "total_tokens": 29833728} {"current_steps": 23555, "total_steps": 40000, "loss": 0.0401, "lr": 0.10867201297661958, "epoch": 1.150929567830357, "percentage": 58.89, "elapsed_time": "1 day, 0:51:26", "remaining_time": "17:21:15", "throughput": 333.46, "total_tokens": 29840096} {"current_steps": 23560, "total_steps": 40000, "loss": 0.0823, "lr": 0.10861539119370689, "epoch": 1.1511738694940512, "percentage": 58.9, "elapsed_time": "1 day, 0:51:29", "remaining_time": "17:20:45", "throughput": 333.52, "total_tokens": 29847040} {"current_steps": 23565, "total_steps": 40000, "loss": 0.0432, "lr": 0.10855877579282096, "epoch": 1.1514181711577456, "percentage": 58.91, "elapsed_time": "1 day, 0:51:33", "remaining_time": "17:20:15", "throughput": 333.59, "total_tokens": 29853728} {"current_steps": 23570, "total_steps": 40000, "loss": 0.0684, "lr": 0.10850216678269252, "epoch": 1.15166247282144, "percentage": 58.93, "elapsed_time": "1 day, 0:51:36", "remaining_time": "17:19:45", "throughput": 333.65, "total_tokens": 29860192} {"current_steps": 23575, "total_steps": 40000, "loss": 0.0458, "lr": 0.10844556417205146, "epoch": 1.1519067744851341, "percentage": 58.94, "elapsed_time": "1 day, 0:51:39", "remaining_time": "17:19:15", "throughput": 333.7, "total_tokens": 29866208} {"current_steps": 23580, "total_steps": 40000, "loss": 0.0485, "lr": 0.10838896796962669, "epoch": 1.1521510761488285, "percentage": 58.95, "elapsed_time": "1 day, 0:51:42", "remaining_time": "17:18:45", "throughput": 333.76, "total_tokens": 29872288} {"current_steps": 23585, "total_steps": 40000, "loss": 0.0679, "lr": 0.1083323781841459, "epoch": 1.1523953778125229, "percentage": 58.96, "elapsed_time": "1 day, 0:51:45", "remaining_time": "17:18:15", "throughput": 333.82, "total_tokens": 29878464} {"current_steps": 23590, "total_steps": 40000, "loss": 0.0457, "lr": 0.10827579482433607, "epoch": 1.1526396794762173, "percentage": 58.98, "elapsed_time": "1 day, 0:51:48", "remaining_time": "17:17:45", "throughput": 333.88, "total_tokens": 29884704} {"current_steps": 23595, "total_steps": 40000, "loss": 0.083, "lr": 0.10821921789892304, "epoch": 1.1528839811399116, "percentage": 58.99, "elapsed_time": "1 day, 0:51:51", "remaining_time": "17:17:15", "throughput": 333.93, "total_tokens": 29891008} {"current_steps": 23600, "total_steps": 40000, "loss": 0.0477, "lr": 0.10816264741663158, "epoch": 1.1531282828036058, "percentage": 59.0, "elapsed_time": "1 day, 0:51:54", "remaining_time": "17:16:45", "throughput": 333.99, "total_tokens": 29897312} {"current_steps": 23600, "total_steps": 40000, "eval_loss": 0.06635206192731857, "epoch": 1.1531282828036058, "percentage": 59.0, "elapsed_time": "1 day, 1:02:35", "remaining_time": "17:24:10", "throughput": 331.62, "total_tokens": 29897312} {"current_steps": 23605, "total_steps": 40000, "loss": 0.0498, "lr": 0.10810608338618573, "epoch": 1.1533725844673002, "percentage": 59.01, "elapsed_time": "1 day, 1:02:39", "remaining_time": "17:23:40", "throughput": 331.68, "total_tokens": 29904224} {"current_steps": 23610, "total_steps": 40000, "loss": 0.0586, "lr": 0.10804952581630821, "epoch": 1.1536168861309946, "percentage": 59.03, "elapsed_time": "1 day, 1:02:42", "remaining_time": "17:23:10", "throughput": 331.74, "total_tokens": 29910144} {"current_steps": 23615, "total_steps": 40000, "loss": 0.0764, "lr": 0.10799297471572102, "epoch": 1.153861187794689, "percentage": 59.04, "elapsed_time": "1 day, 1:02:45", "remaining_time": "17:22:40", "throughput": 331.79, "total_tokens": 29916160} {"current_steps": 23620, "total_steps": 40000, "loss": 0.045, "lr": 0.10793643009314507, "epoch": 1.154105489458383, "percentage": 59.05, "elapsed_time": "1 day, 1:02:48", "remaining_time": "17:22:09", "throughput": 331.85, "total_tokens": 29922240} {"current_steps": 23625, "total_steps": 40000, "loss": 0.0372, "lr": 0.10787989195730015, "epoch": 1.1543497911220775, "percentage": 59.06, "elapsed_time": "1 day, 1:02:51", "remaining_time": "17:21:39", "throughput": 331.91, "total_tokens": 29928896} {"current_steps": 23630, "total_steps": 40000, "loss": 0.0646, "lr": 0.10782336031690525, "epoch": 1.1545940927857719, "percentage": 59.08, "elapsed_time": "1 day, 1:02:54", "remaining_time": "17:21:09", "throughput": 331.97, "total_tokens": 29935168} {"current_steps": 23635, "total_steps": 40000, "loss": 0.0441, "lr": 0.10776683518067821, "epoch": 1.1548383944494662, "percentage": 59.09, "elapsed_time": "1 day, 1:02:57", "remaining_time": "17:20:39", "throughput": 332.03, "total_tokens": 29941696} {"current_steps": 23640, "total_steps": 40000, "loss": 0.0659, "lr": 0.10771031655733587, "epoch": 1.1550826961131606, "percentage": 59.1, "elapsed_time": "1 day, 1:03:00", "remaining_time": "17:20:09", "throughput": 332.1, "total_tokens": 29948576} {"current_steps": 23645, "total_steps": 40000, "loss": 0.0609, "lr": 0.10765380445559422, "epoch": 1.1553269977768548, "percentage": 59.11, "elapsed_time": "1 day, 1:03:03", "remaining_time": "17:19:39", "throughput": 332.16, "total_tokens": 29955296} {"current_steps": 23650, "total_steps": 40000, "loss": 0.0607, "lr": 0.10759729888416801, "epoch": 1.1555712994405491, "percentage": 59.13, "elapsed_time": "1 day, 1:03:07", "remaining_time": "17:19:09", "throughput": 332.22, "total_tokens": 29962016} {"current_steps": 23655, "total_steps": 40000, "loss": 0.0519, "lr": 0.10754079985177119, "epoch": 1.1558156011042435, "percentage": 59.14, "elapsed_time": "1 day, 1:03:10", "remaining_time": "17:18:39", "throughput": 332.28, "total_tokens": 29968416} {"current_steps": 23660, "total_steps": 40000, "loss": 0.0639, "lr": 0.10748430736711667, "epoch": 1.156059902767938, "percentage": 59.15, "elapsed_time": "1 day, 1:03:13", "remaining_time": "17:18:09", "throughput": 332.34, "total_tokens": 29974752} {"current_steps": 23665, "total_steps": 40000, "loss": 0.0532, "lr": 0.10742782143891623, "epoch": 1.156304204431632, "percentage": 59.16, "elapsed_time": "1 day, 1:03:16", "remaining_time": "17:17:38", "throughput": 332.4, "total_tokens": 29981088} {"current_steps": 23670, "total_steps": 40000, "loss": 0.0356, "lr": 0.10737134207588069, "epoch": 1.1565485060953264, "percentage": 59.17, "elapsed_time": "1 day, 1:03:19", "remaining_time": "17:17:08", "throughput": 332.46, "total_tokens": 29987968} {"current_steps": 23675, "total_steps": 40000, "loss": 0.0331, "lr": 0.10731486928671992, "epoch": 1.1567928077590208, "percentage": 59.19, "elapsed_time": "1 day, 1:03:22", "remaining_time": "17:16:38", "throughput": 332.52, "total_tokens": 29994208} {"current_steps": 23680, "total_steps": 40000, "loss": 0.067, "lr": 0.10725840308014269, "epoch": 1.1570371094227152, "percentage": 59.2, "elapsed_time": "1 day, 1:03:25", "remaining_time": "17:16:08", "throughput": 332.58, "total_tokens": 30000448} {"current_steps": 23685, "total_steps": 40000, "loss": 0.0705, "lr": 0.10720194346485688, "epoch": 1.1572814110864096, "percentage": 59.21, "elapsed_time": "1 day, 1:03:28", "remaining_time": "17:15:38", "throughput": 332.64, "total_tokens": 30007104} {"current_steps": 23690, "total_steps": 40000, "loss": 0.0655, "lr": 0.10714549044956918, "epoch": 1.1575257127501037, "percentage": 59.23, "elapsed_time": "1 day, 1:03:31", "remaining_time": "17:15:08", "throughput": 332.7, "total_tokens": 30013440} {"current_steps": 23695, "total_steps": 40000, "loss": 0.0463, "lr": 0.10708904404298542, "epoch": 1.1577700144137981, "percentage": 59.24, "elapsed_time": "1 day, 1:03:35", "remaining_time": "17:14:38", "throughput": 332.76, "total_tokens": 30019968} {"current_steps": 23700, "total_steps": 40000, "loss": 0.0635, "lr": 0.1070326042538103, "epoch": 1.1580143160774925, "percentage": 59.25, "elapsed_time": "1 day, 1:03:38", "remaining_time": "17:14:08", "throughput": 332.82, "total_tokens": 30026208} {"current_steps": 23705, "total_steps": 40000, "loss": 0.0682, "lr": 0.10697617109074758, "epoch": 1.1582586177411869, "percentage": 59.26, "elapsed_time": "1 day, 1:03:41", "remaining_time": "17:13:38", "throughput": 332.87, "total_tokens": 30032192} {"current_steps": 23710, "total_steps": 40000, "loss": 0.0485, "lr": 0.10691974456249999, "epoch": 1.158502919404881, "percentage": 59.27, "elapsed_time": "1 day, 1:03:44", "remaining_time": "17:13:08", "throughput": 332.93, "total_tokens": 30038208} {"current_steps": 23715, "total_steps": 40000, "loss": 0.0458, "lr": 0.10686332467776909, "epoch": 1.1587472210685754, "percentage": 59.29, "elapsed_time": "1 day, 1:03:47", "remaining_time": "17:12:38", "throughput": 332.99, "total_tokens": 30044672} {"current_steps": 23720, "total_steps": 40000, "loss": 0.0724, "lr": 0.10680691144525563, "epoch": 1.1589915227322698, "percentage": 59.3, "elapsed_time": "1 day, 1:03:50", "remaining_time": "17:12:08", "throughput": 333.05, "total_tokens": 30051168} {"current_steps": 23725, "total_steps": 40000, "loss": 0.0563, "lr": 0.10675050487365928, "epoch": 1.1592358243959642, "percentage": 59.31, "elapsed_time": "1 day, 1:03:53", "remaining_time": "17:11:38", "throughput": 333.11, "total_tokens": 30057568} {"current_steps": 23730, "total_steps": 40000, "loss": 0.0529, "lr": 0.10669410497167851, "epoch": 1.1594801260596586, "percentage": 59.33, "elapsed_time": "1 day, 1:03:56", "remaining_time": "17:11:08", "throughput": 333.17, "total_tokens": 30064032} {"current_steps": 23735, "total_steps": 40000, "loss": 0.11, "lr": 0.10663771174801102, "epoch": 1.1597244277233527, "percentage": 59.34, "elapsed_time": "1 day, 1:03:59", "remaining_time": "17:10:38", "throughput": 333.23, "total_tokens": 30070144} {"current_steps": 23740, "total_steps": 40000, "loss": 0.0559, "lr": 0.10658132521135329, "epoch": 1.159968729387047, "percentage": 59.35, "elapsed_time": "1 day, 1:04:02", "remaining_time": "17:10:09", "throughput": 333.29, "total_tokens": 30076864} {"current_steps": 23745, "total_steps": 40000, "loss": 0.063, "lr": 0.10652494537040084, "epoch": 1.1602130310507415, "percentage": 59.36, "elapsed_time": "1 day, 1:04:05", "remaining_time": "17:09:39", "throughput": 333.35, "total_tokens": 30083264} {"current_steps": 23750, "total_steps": 40000, "loss": 0.0814, "lr": 0.1064685722338482, "epoch": 1.1604573327144359, "percentage": 59.38, "elapsed_time": "1 day, 1:04:09", "remaining_time": "17:09:09", "throughput": 333.41, "total_tokens": 30089792} {"current_steps": 23755, "total_steps": 40000, "loss": 0.0619, "lr": 0.10641220581038871, "epoch": 1.16070163437813, "percentage": 59.39, "elapsed_time": "1 day, 1:04:12", "remaining_time": "17:08:39", "throughput": 333.47, "total_tokens": 30096256} {"current_steps": 23760, "total_steps": 40000, "loss": 0.0579, "lr": 0.10635584610871483, "epoch": 1.1609459360418244, "percentage": 59.4, "elapsed_time": "1 day, 1:04:15", "remaining_time": "17:08:09", "throughput": 333.53, "total_tokens": 30102976} {"current_steps": 23765, "total_steps": 40000, "loss": 0.0681, "lr": 0.10629949313751803, "epoch": 1.1611902377055188, "percentage": 59.41, "elapsed_time": "1 day, 1:04:18", "remaining_time": "17:07:39", "throughput": 333.59, "total_tokens": 30109408} {"current_steps": 23770, "total_steps": 40000, "loss": 0.0538, "lr": 0.10624314690548849, "epoch": 1.1614345393692131, "percentage": 59.42, "elapsed_time": "1 day, 1:04:21", "remaining_time": "17:07:09", "throughput": 333.65, "total_tokens": 30115584} {"current_steps": 23775, "total_steps": 40000, "loss": 0.0419, "lr": 0.1061868074213156, "epoch": 1.1616788410329075, "percentage": 59.44, "elapsed_time": "1 day, 1:04:24", "remaining_time": "17:06:40", "throughput": 333.71, "total_tokens": 30122528} {"current_steps": 23780, "total_steps": 40000, "loss": 0.0484, "lr": 0.10613047469368765, "epoch": 1.1619231426966017, "percentage": 59.45, "elapsed_time": "1 day, 1:04:27", "remaining_time": "17:06:10", "throughput": 333.77, "total_tokens": 30128960} {"current_steps": 23785, "total_steps": 40000, "loss": 0.0444, "lr": 0.10607414873129171, "epoch": 1.162167444360296, "percentage": 59.46, "elapsed_time": "1 day, 1:04:30", "remaining_time": "17:05:40", "throughput": 333.83, "total_tokens": 30134720} {"current_steps": 23790, "total_steps": 40000, "loss": 0.0563, "lr": 0.10601782954281413, "epoch": 1.1624117460239904, "percentage": 59.48, "elapsed_time": "1 day, 1:04:33", "remaining_time": "17:05:10", "throughput": 333.88, "total_tokens": 30141056} {"current_steps": 23795, "total_steps": 40000, "loss": 0.0659, "lr": 0.1059615171369399, "epoch": 1.1626560476876848, "percentage": 59.49, "elapsed_time": "1 day, 1:04:37", "remaining_time": "17:04:40", "throughput": 333.94, "total_tokens": 30147424} {"current_steps": 23800, "total_steps": 40000, "loss": 0.0509, "lr": 0.10590521152235312, "epoch": 1.162900349351379, "percentage": 59.5, "elapsed_time": "1 day, 1:04:40", "remaining_time": "17:04:11", "throughput": 334.0, "total_tokens": 30153920} {"current_steps": 23800, "total_steps": 40000, "eval_loss": 0.06390811502933502, "epoch": 1.162900349351379, "percentage": 59.5, "elapsed_time": "1 day, 1:15:20", "remaining_time": "17:11:27", "throughput": 331.65, "total_tokens": 30153920} {"current_steps": 23805, "total_steps": 40000, "loss": 0.0554, "lr": 0.1058489127077369, "epoch": 1.1631446510150734, "percentage": 59.51, "elapsed_time": "1 day, 1:15:24", "remaining_time": "17:10:57", "throughput": 331.7, "total_tokens": 30159776} {"current_steps": 23810, "total_steps": 40000, "loss": 0.0802, "lr": 0.1057926207017732, "epoch": 1.1633889526787677, "percentage": 59.52, "elapsed_time": "1 day, 1:15:27", "remaining_time": "17:10:27", "throughput": 331.76, "total_tokens": 30166080} {"current_steps": 23815, "total_steps": 40000, "loss": 0.0557, "lr": 0.10573633551314285, "epoch": 1.1636332543424621, "percentage": 59.54, "elapsed_time": "1 day, 1:15:30", "remaining_time": "17:09:57", "throughput": 331.82, "total_tokens": 30172608} {"current_steps": 23820, "total_steps": 40000, "loss": 0.0474, "lr": 0.1056800571505259, "epoch": 1.1638775560061565, "percentage": 59.55, "elapsed_time": "1 day, 1:15:33", "remaining_time": "17:09:27", "throughput": 331.88, "total_tokens": 30179360} {"current_steps": 23825, "total_steps": 40000, "loss": 0.0725, "lr": 0.10562378562260105, "epoch": 1.1641218576698507, "percentage": 59.56, "elapsed_time": "1 day, 1:15:36", "remaining_time": "17:08:57", "throughput": 331.94, "total_tokens": 30185888} {"current_steps": 23830, "total_steps": 40000, "loss": 0.0768, "lr": 0.10556752093804615, "epoch": 1.164366159333545, "percentage": 59.58, "elapsed_time": "1 day, 1:15:39", "remaining_time": "17:08:27", "throughput": 332.01, "total_tokens": 30192800} {"current_steps": 23835, "total_steps": 40000, "loss": 0.0521, "lr": 0.10551126310553786, "epoch": 1.1646104609972394, "percentage": 59.59, "elapsed_time": "1 day, 1:15:43", "remaining_time": "17:07:57", "throughput": 332.07, "total_tokens": 30199392} {"current_steps": 23840, "total_steps": 40000, "loss": 0.0422, "lr": 0.10545501213375187, "epoch": 1.1648547626609338, "percentage": 59.6, "elapsed_time": "1 day, 1:15:46", "remaining_time": "17:07:28", "throughput": 332.12, "total_tokens": 30205280} {"current_steps": 23845, "total_steps": 40000, "loss": 0.0358, "lr": 0.10539876803136287, "epoch": 1.165099064324628, "percentage": 59.61, "elapsed_time": "1 day, 1:15:49", "remaining_time": "17:06:58", "throughput": 332.19, "total_tokens": 30212096} {"current_steps": 23850, "total_steps": 40000, "loss": 0.0663, "lr": 0.10534253080704428, "epoch": 1.1653433659883223, "percentage": 59.62, "elapsed_time": "1 day, 1:15:52", "remaining_time": "17:06:28", "throughput": 332.24, "total_tokens": 30218336} {"current_steps": 23855, "total_steps": 40000, "loss": 0.0716, "lr": 0.10528630046946862, "epoch": 1.1655876676520167, "percentage": 59.64, "elapsed_time": "1 day, 1:15:55", "remaining_time": "17:05:58", "throughput": 332.3, "total_tokens": 30224640} {"current_steps": 23860, "total_steps": 40000, "loss": 0.0433, "lr": 0.1052300770273074, "epoch": 1.165831969315711, "percentage": 59.65, "elapsed_time": "1 day, 1:15:58", "remaining_time": "17:05:28", "throughput": 332.36, "total_tokens": 30231264} {"current_steps": 23865, "total_steps": 40000, "loss": 0.0634, "lr": 0.10517386048923086, "epoch": 1.1660762709794055, "percentage": 59.66, "elapsed_time": "1 day, 1:16:01", "remaining_time": "17:04:58", "throughput": 332.42, "total_tokens": 30237568} {"current_steps": 23870, "total_steps": 40000, "loss": 0.0258, "lr": 0.10511765086390841, "epoch": 1.1663205726430996, "percentage": 59.67, "elapsed_time": "1 day, 1:16:04", "remaining_time": "17:04:28", "throughput": 332.48, "total_tokens": 30243904} {"current_steps": 23875, "total_steps": 40000, "loss": 0.0704, "lr": 0.10506144816000816, "epoch": 1.166564874306794, "percentage": 59.69, "elapsed_time": "1 day, 1:16:07", "remaining_time": "17:03:58", "throughput": 332.54, "total_tokens": 30250272} {"current_steps": 23880, "total_steps": 40000, "loss": 0.0532, "lr": 0.10500525238619736, "epoch": 1.1668091759704884, "percentage": 59.7, "elapsed_time": "1 day, 1:16:10", "remaining_time": "17:03:29", "throughput": 332.59, "total_tokens": 30256352} {"current_steps": 23885, "total_steps": 40000, "loss": 0.0627, "lr": 0.10494906355114209, "epoch": 1.1670534776341828, "percentage": 59.71, "elapsed_time": "1 day, 1:16:13", "remaining_time": "17:02:59", "throughput": 332.65, "total_tokens": 30262656} {"current_steps": 23890, "total_steps": 40000, "loss": 0.0835, "lr": 0.10489288166350737, "epoch": 1.167297779297877, "percentage": 59.72, "elapsed_time": "1 day, 1:16:16", "remaining_time": "17:02:29", "throughput": 332.71, "total_tokens": 30268960} {"current_steps": 23895, "total_steps": 40000, "loss": 0.0682, "lr": 0.10483670673195711, "epoch": 1.1675420809615713, "percentage": 59.74, "elapsed_time": "1 day, 1:16:20", "remaining_time": "17:01:59", "throughput": 332.77, "total_tokens": 30275552} {"current_steps": 23900, "total_steps": 40000, "loss": 0.0663, "lr": 0.10478053876515431, "epoch": 1.1677863826252657, "percentage": 59.75, "elapsed_time": "1 day, 1:16:23", "remaining_time": "17:01:29", "throughput": 332.83, "total_tokens": 30282240} {"current_steps": 23905, "total_steps": 40000, "loss": 0.0676, "lr": 0.10472437777176061, "epoch": 1.16803068428896, "percentage": 59.76, "elapsed_time": "1 day, 1:16:26", "remaining_time": "17:01:00", "throughput": 332.89, "total_tokens": 30288416} {"current_steps": 23910, "total_steps": 40000, "loss": 0.0926, "lr": 0.1046682237604369, "epoch": 1.1682749859526544, "percentage": 59.77, "elapsed_time": "1 day, 1:16:29", "remaining_time": "17:00:30", "throughput": 332.94, "total_tokens": 30294368} {"current_steps": 23915, "total_steps": 40000, "loss": 0.0536, "lr": 0.1046120767398427, "epoch": 1.1685192876163486, "percentage": 59.79, "elapsed_time": "1 day, 1:16:32", "remaining_time": "17:00:00", "throughput": 333.0, "total_tokens": 30300384} {"current_steps": 23920, "total_steps": 40000, "loss": 0.054, "lr": 0.10455593671863667, "epoch": 1.168763589280043, "percentage": 59.8, "elapsed_time": "1 day, 1:16:35", "remaining_time": "16:59:30", "throughput": 333.06, "total_tokens": 30306720} {"current_steps": 23925, "total_steps": 40000, "loss": 0.0647, "lr": 0.1044998037054763, "epoch": 1.1690078909437374, "percentage": 59.81, "elapsed_time": "1 day, 1:16:38", "remaining_time": "16:59:01", "throughput": 333.12, "total_tokens": 30313024} {"current_steps": 23930, "total_steps": 40000, "loss": 0.0434, "lr": 0.10444367770901794, "epoch": 1.1692521926074317, "percentage": 59.82, "elapsed_time": "1 day, 1:16:41", "remaining_time": "16:58:31", "throughput": 333.17, "total_tokens": 30318880} {"current_steps": 23935, "total_steps": 40000, "loss": 0.0415, "lr": 0.10438755873791698, "epoch": 1.169496494271126, "percentage": 59.84, "elapsed_time": "1 day, 1:16:44", "remaining_time": "16:58:01", "throughput": 333.23, "total_tokens": 30325376} {"current_steps": 23940, "total_steps": 40000, "loss": 0.0827, "lr": 0.10433144680082775, "epoch": 1.1697407959348203, "percentage": 59.85, "elapsed_time": "1 day, 1:16:47", "remaining_time": "16:57:31", "throughput": 333.29, "total_tokens": 30331616} {"current_steps": 23945, "total_steps": 40000, "loss": 0.0518, "lr": 0.10427534190640322, "epoch": 1.1699850975985147, "percentage": 59.86, "elapsed_time": "1 day, 1:16:50", "remaining_time": "16:57:02", "throughput": 333.35, "total_tokens": 30338400} {"current_steps": 23950, "total_steps": 40000, "loss": 0.0701, "lr": 0.10421924406329568, "epoch": 1.170229399262209, "percentage": 59.88, "elapsed_time": "1 day, 1:16:54", "remaining_time": "16:56:32", "throughput": 333.41, "total_tokens": 30344864} {"current_steps": 23955, "total_steps": 40000, "loss": 0.0258, "lr": 0.10416315328015598, "epoch": 1.1704737009259034, "percentage": 59.89, "elapsed_time": "1 day, 1:16:57", "remaining_time": "16:56:03", "throughput": 333.47, "total_tokens": 30351104} {"current_steps": 23960, "total_steps": 40000, "loss": 0.0642, "lr": 0.10410706956563402, "epoch": 1.1707180025895976, "percentage": 59.9, "elapsed_time": "1 day, 1:17:00", "remaining_time": "16:55:33", "throughput": 333.53, "total_tokens": 30357536} {"current_steps": 23965, "total_steps": 40000, "loss": 0.0862, "lr": 0.10405099292837874, "epoch": 1.170962304253292, "percentage": 59.91, "elapsed_time": "1 day, 1:17:03", "remaining_time": "16:55:03", "throughput": 333.58, "total_tokens": 30363616} {"current_steps": 23970, "total_steps": 40000, "loss": 0.0539, "lr": 0.10399492337703771, "epoch": 1.1712066059169863, "percentage": 59.92, "elapsed_time": "1 day, 1:17:06", "remaining_time": "16:54:34", "throughput": 333.64, "total_tokens": 30370048} {"current_steps": 23975, "total_steps": 40000, "loss": 0.0541, "lr": 0.10393886092025764, "epoch": 1.1714509075806807, "percentage": 59.94, "elapsed_time": "1 day, 1:17:09", "remaining_time": "16:54:04", "throughput": 333.7, "total_tokens": 30376480} {"current_steps": 23980, "total_steps": 40000, "loss": 0.0533, "lr": 0.10388280556668412, "epoch": 1.1716952092443749, "percentage": 59.95, "elapsed_time": "1 day, 1:17:12", "remaining_time": "16:53:34", "throughput": 333.76, "total_tokens": 30382944} {"current_steps": 23985, "total_steps": 40000, "loss": 0.0588, "lr": 0.10382675732496145, "epoch": 1.1719395109080692, "percentage": 59.96, "elapsed_time": "1 day, 1:17:15", "remaining_time": "16:53:05", "throughput": 333.82, "total_tokens": 30389376} {"current_steps": 23990, "total_steps": 40000, "loss": 0.0697, "lr": 0.10377071620373311, "epoch": 1.1721838125717636, "percentage": 59.98, "elapsed_time": "1 day, 1:17:18", "remaining_time": "16:52:35", "throughput": 333.87, "total_tokens": 30395296} {"current_steps": 23995, "total_steps": 40000, "loss": 0.0327, "lr": 0.10371468221164128, "epoch": 1.172428114235458, "percentage": 59.99, "elapsed_time": "1 day, 1:17:21", "remaining_time": "16:52:06", "throughput": 333.93, "total_tokens": 30401376} {"current_steps": 24000, "total_steps": 40000, "loss": 0.0795, "lr": 0.10365865535732706, "epoch": 1.1726724158991524, "percentage": 60.0, "elapsed_time": "1 day, 1:17:24", "remaining_time": "16:51:36", "throughput": 333.99, "total_tokens": 30407616} {"current_steps": 24000, "total_steps": 40000, "eval_loss": 0.0641462430357933, "epoch": 1.1726724158991524, "percentage": 60.0, "elapsed_time": "1 day, 1:28:04", "remaining_time": "16:58:43", "throughput": 331.65, "total_tokens": 30407616} {"current_steps": 24005, "total_steps": 40000, "loss": 0.0564, "lr": 0.10360263564943062, "epoch": 1.1729167175628465, "percentage": 60.01, "elapsed_time": "1 day, 1:28:08", "remaining_time": "16:58:13", "throughput": 331.71, "total_tokens": 30413824} {"current_steps": 24010, "total_steps": 40000, "loss": 0.0573, "lr": 0.10354662309659075, "epoch": 1.173161019226541, "percentage": 60.02, "elapsed_time": "1 day, 1:28:11", "remaining_time": "16:57:44", "throughput": 331.76, "total_tokens": 30419936} {"current_steps": 24015, "total_steps": 40000, "loss": 0.0986, "lr": 0.10349061770744537, "epoch": 1.1734053208902353, "percentage": 60.04, "elapsed_time": "1 day, 1:28:14", "remaining_time": "16:57:14", "throughput": 331.81, "total_tokens": 30425376} {"current_steps": 24020, "total_steps": 40000, "loss": 0.0752, "lr": 0.10343461949063128, "epoch": 1.1736496225539297, "percentage": 60.05, "elapsed_time": "1 day, 1:28:17", "remaining_time": "16:56:44", "throughput": 331.87, "total_tokens": 30431296} {"current_steps": 24025, "total_steps": 40000, "loss": 0.0767, "lr": 0.103378628454784, "epoch": 1.1738939242176238, "percentage": 60.06, "elapsed_time": "1 day, 1:28:20", "remaining_time": "16:56:14", "throughput": 331.92, "total_tokens": 30437472} {"current_steps": 24030, "total_steps": 40000, "loss": 0.0634, "lr": 0.10332264460853811, "epoch": 1.1741382258813182, "percentage": 60.08, "elapsed_time": "1 day, 1:28:23", "remaining_time": "16:55:44", "throughput": 331.98, "total_tokens": 30443680} {"current_steps": 24035, "total_steps": 40000, "loss": 0.0548, "lr": 0.10326666796052701, "epoch": 1.1743825275450126, "percentage": 60.09, "elapsed_time": "1 day, 1:28:26", "remaining_time": "16:55:15", "throughput": 332.03, "total_tokens": 30449760} {"current_steps": 24040, "total_steps": 40000, "loss": 0.0486, "lr": 0.10321069851938296, "epoch": 1.174626829208707, "percentage": 60.1, "elapsed_time": "1 day, 1:28:29", "remaining_time": "16:54:45", "throughput": 332.09, "total_tokens": 30456064} {"current_steps": 24045, "total_steps": 40000, "loss": 0.0809, "lr": 0.10315473629373724, "epoch": 1.1748711308724014, "percentage": 60.11, "elapsed_time": "1 day, 1:28:32", "remaining_time": "16:54:15", "throughput": 332.15, "total_tokens": 30462240} {"current_steps": 24050, "total_steps": 40000, "loss": 0.0629, "lr": 0.10309878129221982, "epoch": 1.1751154325360955, "percentage": 60.12, "elapsed_time": "1 day, 1:28:35", "remaining_time": "16:53:46", "throughput": 332.21, "total_tokens": 30469024} {"current_steps": 24055, "total_steps": 40000, "loss": 0.0605, "lr": 0.10304283352345973, "epoch": 1.17535973419979, "percentage": 60.14, "elapsed_time": "1 day, 1:28:38", "remaining_time": "16:53:16", "throughput": 332.27, "total_tokens": 30475520} {"current_steps": 24060, "total_steps": 40000, "loss": 0.0579, "lr": 0.10298689299608486, "epoch": 1.1756040358634843, "percentage": 60.15, "elapsed_time": "1 day, 1:28:42", "remaining_time": "16:52:46", "throughput": 332.33, "total_tokens": 30482240} {"current_steps": 24065, "total_steps": 40000, "loss": 0.0446, "lr": 0.10293095971872188, "epoch": 1.1758483375271787, "percentage": 60.16, "elapsed_time": "1 day, 1:28:45", "remaining_time": "16:52:17", "throughput": 332.39, "total_tokens": 30488608} {"current_steps": 24070, "total_steps": 40000, "loss": 0.0465, "lr": 0.10287503369999645, "epoch": 1.1760926391908728, "percentage": 60.17, "elapsed_time": "1 day, 1:28:48", "remaining_time": "16:51:47", "throughput": 332.45, "total_tokens": 30495520} {"current_steps": 24075, "total_steps": 40000, "loss": 0.0458, "lr": 0.10281911494853295, "epoch": 1.1763369408545672, "percentage": 60.19, "elapsed_time": "1 day, 1:28:51", "remaining_time": "16:51:18", "throughput": 332.51, "total_tokens": 30501952} {"current_steps": 24080, "total_steps": 40000, "loss": 0.043, "lr": 0.10276320347295485, "epoch": 1.1765812425182616, "percentage": 60.2, "elapsed_time": "1 day, 1:28:54", "remaining_time": "16:50:48", "throughput": 332.57, "total_tokens": 30508128} {"current_steps": 24085, "total_steps": 40000, "loss": 0.0437, "lr": 0.10270729928188446, "epoch": 1.176825544181956, "percentage": 60.21, "elapsed_time": "1 day, 1:28:57", "remaining_time": "16:50:18", "throughput": 332.62, "total_tokens": 30513792} {"current_steps": 24090, "total_steps": 40000, "loss": 0.0726, "lr": 0.10265140238394276, "epoch": 1.1770698458456503, "percentage": 60.22, "elapsed_time": "1 day, 1:29:00", "remaining_time": "16:49:49", "throughput": 332.68, "total_tokens": 30519840} {"current_steps": 24095, "total_steps": 40000, "loss": 0.0539, "lr": 0.10259551278774988, "epoch": 1.1773141475093445, "percentage": 60.24, "elapsed_time": "1 day, 1:29:03", "remaining_time": "16:49:19", "throughput": 332.73, "total_tokens": 30526112} {"current_steps": 24100, "total_steps": 40000, "loss": 0.0797, "lr": 0.10253963050192462, "epoch": 1.1775584491730389, "percentage": 60.25, "elapsed_time": "1 day, 1:29:06", "remaining_time": "16:48:50", "throughput": 332.79, "total_tokens": 30532672} {"current_steps": 24105, "total_steps": 40000, "loss": 0.0627, "lr": 0.10248375553508478, "epoch": 1.1778027508367332, "percentage": 60.26, "elapsed_time": "1 day, 1:29:09", "remaining_time": "16:48:20", "throughput": 332.85, "total_tokens": 30538656} {"current_steps": 24110, "total_steps": 40000, "loss": 0.075, "lr": 0.102427887895847, "epoch": 1.1780470525004274, "percentage": 60.27, "elapsed_time": "1 day, 1:29:12", "remaining_time": "16:47:50", "throughput": 332.9, "total_tokens": 30544384} {"current_steps": 24115, "total_steps": 40000, "loss": 0.0687, "lr": 0.10237202759282668, "epoch": 1.1782913541641218, "percentage": 60.29, "elapsed_time": "1 day, 1:29:15", "remaining_time": "16:47:21", "throughput": 332.95, "total_tokens": 30550464} {"current_steps": 24120, "total_steps": 40000, "loss": 0.0565, "lr": 0.10231617463463821, "epoch": 1.1785356558278162, "percentage": 60.3, "elapsed_time": "1 day, 1:29:19", "remaining_time": "16:46:51", "throughput": 333.01, "total_tokens": 30556384} {"current_steps": 24125, "total_steps": 40000, "loss": 0.076, "lr": 0.10226032902989492, "epoch": 1.1787799574915105, "percentage": 60.31, "elapsed_time": "1 day, 1:29:22", "remaining_time": "16:46:22", "throughput": 333.06, "total_tokens": 30562272} {"current_steps": 24130, "total_steps": 40000, "loss": 0.0697, "lr": 0.10220449078720877, "epoch": 1.179024259155205, "percentage": 60.32, "elapsed_time": "1 day, 1:29:25", "remaining_time": "16:45:52", "throughput": 333.11, "total_tokens": 30568032} {"current_steps": 24135, "total_steps": 40000, "loss": 0.0478, "lr": 0.1021486599151908, "epoch": 1.179268560818899, "percentage": 60.34, "elapsed_time": "1 day, 1:29:28", "remaining_time": "16:45:23", "throughput": 333.17, "total_tokens": 30574240} {"current_steps": 24140, "total_steps": 40000, "loss": 0.0416, "lr": 0.10209283642245084, "epoch": 1.1795128624825935, "percentage": 60.35, "elapsed_time": "1 day, 1:29:31", "remaining_time": "16:44:53", "throughput": 333.23, "total_tokens": 30580704} {"current_steps": 24145, "total_steps": 40000, "loss": 0.0428, "lr": 0.10203702031759748, "epoch": 1.1797571641462878, "percentage": 60.36, "elapsed_time": "1 day, 1:29:34", "remaining_time": "16:44:24", "throughput": 333.28, "total_tokens": 30586784} {"current_steps": 24150, "total_steps": 40000, "loss": 0.0663, "lr": 0.1019812116092384, "epoch": 1.1800014658099822, "percentage": 60.38, "elapsed_time": "1 day, 1:29:37", "remaining_time": "16:43:54", "throughput": 333.34, "total_tokens": 30592864} {"current_steps": 24155, "total_steps": 40000, "loss": 0.064, "lr": 0.10192541030597986, "epoch": 1.1802457674736764, "percentage": 60.39, "elapsed_time": "1 day, 1:29:40", "remaining_time": "16:43:25", "throughput": 333.39, "total_tokens": 30599072} {"current_steps": 24160, "total_steps": 40000, "loss": 0.0638, "lr": 0.1018696164164272, "epoch": 1.1804900691373708, "percentage": 60.4, "elapsed_time": "1 day, 1:29:43", "remaining_time": "16:42:55", "throughput": 333.46, "total_tokens": 30606112} {"current_steps": 24165, "total_steps": 40000, "loss": 0.0577, "lr": 0.10181382994918459, "epoch": 1.1807343708010651, "percentage": 60.41, "elapsed_time": "1 day, 1:29:46", "remaining_time": "16:42:26", "throughput": 333.52, "total_tokens": 30612416} {"current_steps": 24170, "total_steps": 40000, "loss": 0.0668, "lr": 0.10175805091285492, "epoch": 1.1809786724647595, "percentage": 60.42, "elapsed_time": "1 day, 1:29:49", "remaining_time": "16:41:57", "throughput": 333.58, "total_tokens": 30618944} {"current_steps": 24175, "total_steps": 40000, "loss": 0.0441, "lr": 0.10170227931603999, "epoch": 1.181222974128454, "percentage": 60.44, "elapsed_time": "1 day, 1:29:52", "remaining_time": "16:41:27", "throughput": 333.63, "total_tokens": 30625088} {"current_steps": 24180, "total_steps": 40000, "loss": 0.06, "lr": 0.10164651516734062, "epoch": 1.181467275792148, "percentage": 60.45, "elapsed_time": "1 day, 1:29:55", "remaining_time": "16:40:58", "throughput": 333.69, "total_tokens": 30631552} {"current_steps": 24185, "total_steps": 40000, "loss": 0.0474, "lr": 0.1015907584753562, "epoch": 1.1817115774558424, "percentage": 60.46, "elapsed_time": "1 day, 1:29:59", "remaining_time": "16:40:29", "throughput": 333.75, "total_tokens": 30637792} {"current_steps": 24190, "total_steps": 40000, "loss": 0.0698, "lr": 0.10153500924868523, "epoch": 1.1819558791195368, "percentage": 60.48, "elapsed_time": "1 day, 1:30:02", "remaining_time": "16:39:59", "throughput": 333.81, "total_tokens": 30644128} {"current_steps": 24195, "total_steps": 40000, "loss": 0.0402, "lr": 0.10147926749592483, "epoch": 1.1822001807832312, "percentage": 60.49, "elapsed_time": "1 day, 1:30:05", "remaining_time": "16:39:30", "throughput": 333.87, "total_tokens": 30650592} {"current_steps": 24200, "total_steps": 40000, "loss": 0.0646, "lr": 0.10142353322567112, "epoch": 1.1824444824469253, "percentage": 60.5, "elapsed_time": "1 day, 1:30:08", "remaining_time": "16:39:00", "throughput": 333.92, "total_tokens": 30656768} {"current_steps": 24200, "total_steps": 40000, "eval_loss": 0.06363477557897568, "epoch": 1.1824444824469253, "percentage": 60.5, "elapsed_time": "1 day, 1:40:48", "remaining_time": "16:45:59", "throughput": 331.61, "total_tokens": 30656768} {"current_steps": 24205, "total_steps": 40000, "loss": 0.0469, "lr": 0.1013678064465191, "epoch": 1.1826887841106197, "percentage": 60.51, "elapsed_time": "1 day, 1:40:52", "remaining_time": "16:45:30", "throughput": 331.67, "total_tokens": 30663584} {"current_steps": 24210, "total_steps": 40000, "loss": 0.0388, "lr": 0.10131208716706244, "epoch": 1.182933085774314, "percentage": 60.52, "elapsed_time": "1 day, 1:40:55", "remaining_time": "16:45:00", "throughput": 331.72, "total_tokens": 30669792} {"current_steps": 24215, "total_steps": 40000, "loss": 0.0594, "lr": 0.10125637539589379, "epoch": 1.1831773874380085, "percentage": 60.54, "elapsed_time": "1 day, 1:40:58", "remaining_time": "16:44:30", "throughput": 331.78, "total_tokens": 30676128} {"current_steps": 24220, "total_steps": 40000, "loss": 0.0576, "lr": 0.10120067114160464, "epoch": 1.1834216891017029, "percentage": 60.55, "elapsed_time": "1 day, 1:41:01", "remaining_time": "16:44:01", "throughput": 331.84, "total_tokens": 30682944} {"current_steps": 24225, "total_steps": 40000, "loss": 0.0663, "lr": 0.10114497441278517, "epoch": 1.183665990765397, "percentage": 60.56, "elapsed_time": "1 day, 1:41:05", "remaining_time": "16:43:32", "throughput": 331.9, "total_tokens": 30689248} {"current_steps": 24230, "total_steps": 40000, "loss": 0.0468, "lr": 0.10108928521802468, "epoch": 1.1839102924290914, "percentage": 60.58, "elapsed_time": "1 day, 1:41:08", "remaining_time": "16:43:02", "throughput": 331.96, "total_tokens": 30695424} {"current_steps": 24235, "total_steps": 40000, "loss": 0.0434, "lr": 0.101033603565911, "epoch": 1.1841545940927858, "percentage": 60.59, "elapsed_time": "1 day, 1:41:11", "remaining_time": "16:42:33", "throughput": 332.02, "total_tokens": 30701952} {"current_steps": 24240, "total_steps": 40000, "loss": 0.0447, "lr": 0.10097792946503102, "epoch": 1.1843988957564802, "percentage": 60.6, "elapsed_time": "1 day, 1:41:14", "remaining_time": "16:42:03", "throughput": 332.08, "total_tokens": 30708576} {"current_steps": 24245, "total_steps": 40000, "loss": 0.074, "lr": 0.10092226292397039, "epoch": 1.1846431974201743, "percentage": 60.61, "elapsed_time": "1 day, 1:41:17", "remaining_time": "16:41:34", "throughput": 332.13, "total_tokens": 30714528} {"current_steps": 24250, "total_steps": 40000, "loss": 0.0722, "lr": 0.10086660395131354, "epoch": 1.1848874990838687, "percentage": 60.62, "elapsed_time": "1 day, 1:41:20", "remaining_time": "16:41:04", "throughput": 332.19, "total_tokens": 30720864} {"current_steps": 24255, "total_steps": 40000, "loss": 0.0652, "lr": 0.10081095255564385, "epoch": 1.185131800747563, "percentage": 60.64, "elapsed_time": "1 day, 1:41:23", "remaining_time": "16:40:35", "throughput": 332.25, "total_tokens": 30727712} {"current_steps": 24260, "total_steps": 40000, "loss": 0.05, "lr": 0.10075530874554335, "epoch": 1.1853761024112575, "percentage": 60.65, "elapsed_time": "1 day, 1:41:26", "remaining_time": "16:40:05", "throughput": 332.31, "total_tokens": 30733952} {"current_steps": 24265, "total_steps": 40000, "loss": 0.0352, "lr": 0.10069967252959311, "epoch": 1.1856204040749518, "percentage": 60.66, "elapsed_time": "1 day, 1:41:29", "remaining_time": "16:39:36", "throughput": 332.36, "total_tokens": 30740032} {"current_steps": 24270, "total_steps": 40000, "loss": 0.0548, "lr": 0.10064404391637297, "epoch": 1.185864705738646, "percentage": 60.68, "elapsed_time": "1 day, 1:41:32", "remaining_time": "16:39:06", "throughput": 332.42, "total_tokens": 30746304} {"current_steps": 24275, "total_steps": 40000, "loss": 0.057, "lr": 0.10058842291446145, "epoch": 1.1861090074023404, "percentage": 60.69, "elapsed_time": "1 day, 1:41:35", "remaining_time": "16:38:37", "throughput": 332.48, "total_tokens": 30752896} {"current_steps": 24280, "total_steps": 40000, "loss": 0.0219, "lr": 0.10053280953243608, "epoch": 1.1863533090660348, "percentage": 60.7, "elapsed_time": "1 day, 1:41:39", "remaining_time": "16:38:08", "throughput": 332.53, "total_tokens": 30758912} {"current_steps": 24285, "total_steps": 40000, "loss": 0.0615, "lr": 0.10047720377887315, "epoch": 1.1865976107297291, "percentage": 60.71, "elapsed_time": "1 day, 1:41:42", "remaining_time": "16:37:38", "throughput": 332.59, "total_tokens": 30764896} {"current_steps": 24290, "total_steps": 40000, "loss": 0.069, "lr": 0.10042160566234767, "epoch": 1.1868419123934233, "percentage": 60.72, "elapsed_time": "1 day, 1:41:45", "remaining_time": "16:37:09", "throughput": 332.64, "total_tokens": 30770944} {"current_steps": 24295, "total_steps": 40000, "loss": 0.0806, "lr": 0.10036601519143372, "epoch": 1.1870862140571177, "percentage": 60.74, "elapsed_time": "1 day, 1:41:48", "remaining_time": "16:36:39", "throughput": 332.69, "total_tokens": 30776832} {"current_steps": 24300, "total_steps": 40000, "loss": 0.0484, "lr": 0.1003104323747039, "epoch": 1.187330515720812, "percentage": 60.75, "elapsed_time": "1 day, 1:41:51", "remaining_time": "16:36:10", "throughput": 332.75, "total_tokens": 30783392} {"current_steps": 24305, "total_steps": 40000, "loss": 0.0453, "lr": 0.10025485722072984, "epoch": 1.1875748173845064, "percentage": 60.76, "elapsed_time": "1 day, 1:41:54", "remaining_time": "16:35:41", "throughput": 332.81, "total_tokens": 30789440} {"current_steps": 24310, "total_steps": 40000, "loss": 0.0684, "lr": 0.10019928973808201, "epoch": 1.1878191190482008, "percentage": 60.77, "elapsed_time": "1 day, 1:41:57", "remaining_time": "16:35:11", "throughput": 332.86, "total_tokens": 30795552} {"current_steps": 24315, "total_steps": 40000, "loss": 0.0733, "lr": 0.10014372993532945, "epoch": 1.188063420711895, "percentage": 60.79, "elapsed_time": "1 day, 1:42:00", "remaining_time": "16:34:42", "throughput": 332.92, "total_tokens": 30801632} {"current_steps": 24320, "total_steps": 40000, "loss": 0.0683, "lr": 0.1000881778210403, "epoch": 1.1883077223755893, "percentage": 60.8, "elapsed_time": "1 day, 1:42:03", "remaining_time": "16:34:13", "throughput": 332.98, "total_tokens": 30808000} {"current_steps": 24325, "total_steps": 40000, "loss": 0.079, "lr": 0.10003263340378142, "epoch": 1.1885520240392837, "percentage": 60.81, "elapsed_time": "1 day, 1:42:06", "remaining_time": "16:33:44", "throughput": 333.04, "total_tokens": 30814656} {"current_steps": 24330, "total_steps": 40000, "loss": 0.0537, "lr": 0.09997709669211834, "epoch": 1.188796325702978, "percentage": 60.82, "elapsed_time": "1 day, 1:42:09", "remaining_time": "16:33:14", "throughput": 333.1, "total_tokens": 30821472} {"current_steps": 24335, "total_steps": 40000, "loss": 0.0509, "lr": 0.0999215676946156, "epoch": 1.1890406273666723, "percentage": 60.84, "elapsed_time": "1 day, 1:42:12", "remaining_time": "16:32:45", "throughput": 333.16, "total_tokens": 30827872} {"current_steps": 24340, "total_steps": 40000, "loss": 0.0808, "lr": 0.0998660464198364, "epoch": 1.1892849290303666, "percentage": 60.85, "elapsed_time": "1 day, 1:42:15", "remaining_time": "16:32:16", "throughput": 333.21, "total_tokens": 30834144} {"current_steps": 24345, "total_steps": 40000, "loss": 0.0508, "lr": 0.09981053287634288, "epoch": 1.189529230694061, "percentage": 60.86, "elapsed_time": "1 day, 1:42:19", "remaining_time": "16:31:47", "throughput": 333.27, "total_tokens": 30840448} {"current_steps": 24350, "total_steps": 40000, "loss": 0.0519, "lr": 0.09975502707269596, "epoch": 1.1897735323577554, "percentage": 60.88, "elapsed_time": "1 day, 1:42:22", "remaining_time": "16:31:17", "throughput": 333.33, "total_tokens": 30846944} {"current_steps": 24355, "total_steps": 40000, "loss": 0.0414, "lr": 0.09969952901745524, "epoch": 1.1900178340214498, "percentage": 60.89, "elapsed_time": "1 day, 1:42:25", "remaining_time": "16:30:48", "throughput": 333.38, "total_tokens": 30853120} {"current_steps": 24360, "total_steps": 40000, "loss": 0.0409, "lr": 0.09964403871917925, "epoch": 1.190262135685144, "percentage": 60.9, "elapsed_time": "1 day, 1:42:28", "remaining_time": "16:30:19", "throughput": 333.44, "total_tokens": 30859488} {"current_steps": 24365, "total_steps": 40000, "loss": 0.0552, "lr": 0.09958855618642536, "epoch": 1.1905064373488383, "percentage": 60.91, "elapsed_time": "1 day, 1:42:31", "remaining_time": "16:29:50", "throughput": 333.5, "total_tokens": 30865632} {"current_steps": 24370, "total_steps": 40000, "loss": 0.0565, "lr": 0.09953308142774955, "epoch": 1.1907507390125327, "percentage": 60.92, "elapsed_time": "1 day, 1:42:34", "remaining_time": "16:29:20", "throughput": 333.55, "total_tokens": 30871488} {"current_steps": 24375, "total_steps": 40000, "loss": 0.0476, "lr": 0.09947761445170686, "epoch": 1.190995040676227, "percentage": 60.94, "elapsed_time": "1 day, 1:42:37", "remaining_time": "16:28:51", "throughput": 333.6, "total_tokens": 30877504} {"current_steps": 24380, "total_steps": 40000, "loss": 0.0734, "lr": 0.09942215526685086, "epoch": 1.1912393423399212, "percentage": 60.95, "elapsed_time": "1 day, 1:42:40", "remaining_time": "16:28:22", "throughput": 333.66, "total_tokens": 30883744} {"current_steps": 24385, "total_steps": 40000, "loss": 0.0668, "lr": 0.09936670388173414, "epoch": 1.1914836440036156, "percentage": 60.96, "elapsed_time": "1 day, 1:42:43", "remaining_time": "16:27:53", "throughput": 333.71, "total_tokens": 30889632} {"current_steps": 24390, "total_steps": 40000, "loss": 0.0541, "lr": 0.09931126030490799, "epoch": 1.19172794566731, "percentage": 60.98, "elapsed_time": "1 day, 1:42:46", "remaining_time": "16:27:24", "throughput": 333.77, "total_tokens": 30895840} {"current_steps": 24395, "total_steps": 40000, "loss": 0.0399, "lr": 0.0992558245449225, "epoch": 1.1919722473310044, "percentage": 60.99, "elapsed_time": "1 day, 1:42:49", "remaining_time": "16:26:54", "throughput": 333.83, "total_tokens": 30902016} {"current_steps": 24400, "total_steps": 40000, "loss": 0.0816, "lr": 0.09920039661032651, "epoch": 1.1922165489946988, "percentage": 61.0, "elapsed_time": "1 day, 1:42:52", "remaining_time": "16:26:25", "throughput": 333.88, "total_tokens": 30908480} {"current_steps": 24400, "total_steps": 40000, "eval_loss": 0.06651005893945694, "epoch": 1.1922165489946988, "percentage": 61.0, "elapsed_time": "1 day, 1:53:33", "remaining_time": "16:33:15", "throughput": 331.59, "total_tokens": 30908480} {"current_steps": 24405, "total_steps": 40000, "loss": 0.0787, "lr": 0.09914497650966782, "epoch": 1.192460850658393, "percentage": 61.01, "elapsed_time": "1 day, 1:53:36", "remaining_time": "16:32:46", "throughput": 331.65, "total_tokens": 30915264} {"current_steps": 24410, "total_steps": 40000, "loss": 0.0447, "lr": 0.09908956425149276, "epoch": 1.1927051523220873, "percentage": 61.02, "elapsed_time": "1 day, 1:53:40", "remaining_time": "16:32:17", "throughput": 331.7, "total_tokens": 30921504} {"current_steps": 24415, "total_steps": 40000, "loss": 0.0422, "lr": 0.09903415984434677, "epoch": 1.1929494539857817, "percentage": 61.04, "elapsed_time": "1 day, 1:53:43", "remaining_time": "16:31:47", "throughput": 331.76, "total_tokens": 30928032} {"current_steps": 24420, "total_steps": 40000, "loss": 0.0513, "lr": 0.09897876329677373, "epoch": 1.193193755649476, "percentage": 61.05, "elapsed_time": "1 day, 1:53:46", "remaining_time": "16:31:18", "throughput": 331.82, "total_tokens": 30934176} {"current_steps": 24425, "total_steps": 40000, "loss": 0.0772, "lr": 0.09892337461731658, "epoch": 1.1934380573131702, "percentage": 61.06, "elapsed_time": "1 day, 1:53:49", "remaining_time": "16:30:49", "throughput": 331.87, "total_tokens": 30940256} {"current_steps": 24430, "total_steps": 40000, "loss": 0.1059, "lr": 0.09886799381451693, "epoch": 1.1936823589768646, "percentage": 61.08, "elapsed_time": "1 day, 1:53:52", "remaining_time": "16:30:19", "throughput": 331.93, "total_tokens": 30946240} {"current_steps": 24435, "total_steps": 40000, "loss": 0.0698, "lr": 0.09881262089691521, "epoch": 1.193926660640559, "percentage": 61.09, "elapsed_time": "1 day, 1:53:55", "remaining_time": "16:29:50", "throughput": 331.98, "total_tokens": 30952320} {"current_steps": 24440, "total_steps": 40000, "loss": 0.059, "lr": 0.09875725587305059, "epoch": 1.1941709623042533, "percentage": 61.1, "elapsed_time": "1 day, 1:53:58", "remaining_time": "16:29:21", "throughput": 332.04, "total_tokens": 30958560} {"current_steps": 24445, "total_steps": 40000, "loss": 0.0572, "lr": 0.09870189875146111, "epoch": 1.1944152639679477, "percentage": 61.11, "elapsed_time": "1 day, 1:54:01", "remaining_time": "16:28:51", "throughput": 332.09, "total_tokens": 30964992} {"current_steps": 24450, "total_steps": 40000, "loss": 0.0443, "lr": 0.09864654954068346, "epoch": 1.1946595656316419, "percentage": 61.12, "elapsed_time": "1 day, 1:54:04", "remaining_time": "16:28:22", "throughput": 332.15, "total_tokens": 30971200} {"current_steps": 24455, "total_steps": 40000, "loss": 0.0701, "lr": 0.09859120824925326, "epoch": 1.1949038672953363, "percentage": 61.14, "elapsed_time": "1 day, 1:54:07", "remaining_time": "16:27:53", "throughput": 332.21, "total_tokens": 30977536} {"current_steps": 24460, "total_steps": 40000, "loss": 0.0516, "lr": 0.09853587488570474, "epoch": 1.1951481689590306, "percentage": 61.15, "elapsed_time": "1 day, 1:54:10", "remaining_time": "16:27:24", "throughput": 332.27, "total_tokens": 30984096} {"current_steps": 24465, "total_steps": 40000, "loss": 0.0475, "lr": 0.09848054945857107, "epoch": 1.195392470622725, "percentage": 61.16, "elapsed_time": "1 day, 1:54:13", "remaining_time": "16:26:55", "throughput": 332.32, "total_tokens": 30990240} {"current_steps": 24470, "total_steps": 40000, "loss": 0.0598, "lr": 0.09842523197638416, "epoch": 1.1956367722864192, "percentage": 61.18, "elapsed_time": "1 day, 1:54:16", "remaining_time": "16:26:25", "throughput": 332.39, "total_tokens": 30997312} {"current_steps": 24475, "total_steps": 40000, "loss": 0.0719, "lr": 0.09836992244767452, "epoch": 1.1958810739501136, "percentage": 61.19, "elapsed_time": "1 day, 1:54:20", "remaining_time": "16:25:56", "throughput": 332.44, "total_tokens": 31003584} {"current_steps": 24480, "total_steps": 40000, "loss": 0.0631, "lr": 0.09831462088097168, "epoch": 1.196125375613808, "percentage": 61.2, "elapsed_time": "1 day, 1:54:22", "remaining_time": "16:25:27", "throughput": 332.49, "total_tokens": 31009248} {"current_steps": 24485, "total_steps": 40000, "loss": 0.0765, "lr": 0.09825932728480385, "epoch": 1.1963696772775023, "percentage": 61.21, "elapsed_time": "1 day, 1:54:26", "remaining_time": "16:24:58", "throughput": 332.55, "total_tokens": 31015424} {"current_steps": 24490, "total_steps": 40000, "loss": 0.0754, "lr": 0.09820404166769794, "epoch": 1.1966139789411967, "percentage": 61.22, "elapsed_time": "1 day, 1:54:29", "remaining_time": "16:24:29", "throughput": 332.6, "total_tokens": 31021760} {"current_steps": 24495, "total_steps": 40000, "loss": 0.0831, "lr": 0.09814876403817978, "epoch": 1.1968582806048909, "percentage": 61.24, "elapsed_time": "1 day, 1:54:32", "remaining_time": "16:24:00", "throughput": 332.66, "total_tokens": 31028288} {"current_steps": 24500, "total_steps": 40000, "loss": 0.0335, "lr": 0.09809349440477376, "epoch": 1.1971025822685852, "percentage": 61.25, "elapsed_time": "1 day, 1:54:35", "remaining_time": "16:23:30", "throughput": 332.72, "total_tokens": 31034720} {"current_steps": 24505, "total_steps": 40000, "loss": 0.1024, "lr": 0.09803823277600317, "epoch": 1.1973468839322796, "percentage": 61.26, "elapsed_time": "1 day, 1:54:38", "remaining_time": "16:23:01", "throughput": 332.77, "total_tokens": 31040576} {"current_steps": 24510, "total_steps": 40000, "loss": 0.0432, "lr": 0.09798297916039014, "epoch": 1.197591185595974, "percentage": 61.27, "elapsed_time": "1 day, 1:54:41", "remaining_time": "16:22:32", "throughput": 332.83, "total_tokens": 31046720} {"current_steps": 24515, "total_steps": 40000, "loss": 0.0503, "lr": 0.09792773356645534, "epoch": 1.1978354872596682, "percentage": 61.29, "elapsed_time": "1 day, 1:54:44", "remaining_time": "16:22:03", "throughput": 332.89, "total_tokens": 31053536} {"current_steps": 24520, "total_steps": 40000, "loss": 0.0689, "lr": 0.09787249600271843, "epoch": 1.1980797889233625, "percentage": 61.3, "elapsed_time": "1 day, 1:54:47", "remaining_time": "16:21:34", "throughput": 332.95, "total_tokens": 31060224} {"current_steps": 24525, "total_steps": 40000, "loss": 0.0651, "lr": 0.09781726647769776, "epoch": 1.198324090587057, "percentage": 61.31, "elapsed_time": "1 day, 1:54:50", "remaining_time": "16:21:05", "throughput": 333.0, "total_tokens": 31065952} {"current_steps": 24530, "total_steps": 40000, "loss": 0.0754, "lr": 0.0977620449999103, "epoch": 1.1985683922507513, "percentage": 61.32, "elapsed_time": "1 day, 1:54:53", "remaining_time": "16:20:36", "throughput": 333.06, "total_tokens": 31072896} {"current_steps": 24535, "total_steps": 40000, "loss": 0.0615, "lr": 0.09770683157787204, "epoch": 1.1988126939144457, "percentage": 61.34, "elapsed_time": "1 day, 1:54:56", "remaining_time": "16:20:07", "throughput": 333.12, "total_tokens": 31078816} {"current_steps": 24540, "total_steps": 40000, "loss": 0.0369, "lr": 0.09765162622009745, "epoch": 1.1990569955781398, "percentage": 61.35, "elapsed_time": "1 day, 1:55:00", "remaining_time": "16:19:38", "throughput": 333.18, "total_tokens": 31085280} {"current_steps": 24545, "total_steps": 40000, "loss": 0.0566, "lr": 0.09759642893509995, "epoch": 1.1993012972418342, "percentage": 61.36, "elapsed_time": "1 day, 1:55:03", "remaining_time": "16:19:09", "throughput": 333.23, "total_tokens": 31091552} {"current_steps": 24550, "total_steps": 40000, "loss": 0.0479, "lr": 0.09754123973139169, "epoch": 1.1995455989055286, "percentage": 61.38, "elapsed_time": "1 day, 1:55:06", "remaining_time": "16:18:40", "throughput": 333.29, "total_tokens": 31098272} {"current_steps": 24555, "total_steps": 40000, "loss": 0.0501, "lr": 0.09748605861748345, "epoch": 1.199789900569223, "percentage": 61.39, "elapsed_time": "1 day, 1:55:09", "remaining_time": "16:18:11", "throughput": 333.35, "total_tokens": 31104576} {"current_steps": 24560, "total_steps": 40000, "loss": 0.0472, "lr": 0.0974308856018849, "epoch": 1.2000342022329171, "percentage": 61.4, "elapsed_time": "1 day, 1:55:12", "remaining_time": "16:17:42", "throughput": 333.4, "total_tokens": 31110624} {"current_steps": 24565, "total_steps": 40000, "loss": 0.0462, "lr": 0.09737572069310449, "epoch": 1.2002785038966115, "percentage": 61.41, "elapsed_time": "1 day, 1:55:15", "remaining_time": "16:17:13", "throughput": 333.46, "total_tokens": 31116896} {"current_steps": 24570, "total_steps": 40000, "loss": 0.0955, "lr": 0.09732056389964922, "epoch": 1.2005228055603059, "percentage": 61.42, "elapsed_time": "1 day, 1:55:18", "remaining_time": "16:16:44", "throughput": 333.52, "total_tokens": 31123264} {"current_steps": 24575, "total_steps": 40000, "loss": 0.0407, "lr": 0.097265415230025, "epoch": 1.2007671072240003, "percentage": 61.44, "elapsed_time": "1 day, 1:55:21", "remaining_time": "16:16:15", "throughput": 333.58, "total_tokens": 31129984} {"current_steps": 24580, "total_steps": 40000, "loss": 0.0612, "lr": 0.09721027469273648, "epoch": 1.2010114088876946, "percentage": 61.45, "elapsed_time": "1 day, 1:55:24", "remaining_time": "16:15:46", "throughput": 333.63, "total_tokens": 31135904} {"current_steps": 24585, "total_steps": 40000, "loss": 0.0665, "lr": 0.09715514229628695, "epoch": 1.2012557105513888, "percentage": 61.46, "elapsed_time": "1 day, 1:55:28", "remaining_time": "16:15:17", "throughput": 333.7, "total_tokens": 31143712} {"current_steps": 24590, "total_steps": 40000, "loss": 0.0387, "lr": 0.09710001804917864, "epoch": 1.2015000122150832, "percentage": 61.48, "elapsed_time": "1 day, 1:55:31", "remaining_time": "16:14:48", "throughput": 333.75, "total_tokens": 31149696} {"current_steps": 24595, "total_steps": 40000, "loss": 0.0584, "lr": 0.09704490195991226, "epoch": 1.2017443138787776, "percentage": 61.49, "elapsed_time": "1 day, 1:55:34", "remaining_time": "16:14:19", "throughput": 333.81, "total_tokens": 31155936} {"current_steps": 24600, "total_steps": 40000, "loss": 0.111, "lr": 0.09698979403698753, "epoch": 1.201988615542472, "percentage": 61.5, "elapsed_time": "1 day, 1:55:37", "remaining_time": "16:13:50", "throughput": 333.87, "total_tokens": 31162176} {"current_steps": 24600, "total_steps": 40000, "eval_loss": 0.06342479586601257, "epoch": 1.201988615542472, "percentage": 61.5, "elapsed_time": "1 day, 2:06:17", "remaining_time": "16:20:31", "throughput": 331.59, "total_tokens": 31162176} {"current_steps": 24605, "total_steps": 40000, "loss": 0.0523, "lr": 0.0969346942889027, "epoch": 1.202232917206166, "percentage": 61.51, "elapsed_time": "1 day, 2:06:21", "remaining_time": "16:20:02", "throughput": 331.65, "total_tokens": 31168640} {"current_steps": 24610, "total_steps": 40000, "loss": 0.0563, "lr": 0.09687960272415487, "epoch": 1.2024772188698605, "percentage": 61.52, "elapsed_time": "1 day, 2:06:24", "remaining_time": "16:19:33", "throughput": 331.7, "total_tokens": 31175040} {"current_steps": 24615, "total_steps": 40000, "loss": 0.097, "lr": 0.0968245193512399, "epoch": 1.2027215205335549, "percentage": 61.54, "elapsed_time": "1 day, 2:06:27", "remaining_time": "16:19:04", "throughput": 331.75, "total_tokens": 31180768} {"current_steps": 24620, "total_steps": 40000, "loss": 0.0366, "lr": 0.09676944417865221, "epoch": 1.2029658221972492, "percentage": 61.55, "elapsed_time": "1 day, 2:06:30", "remaining_time": "16:18:35", "throughput": 331.81, "total_tokens": 31187104} {"current_steps": 24625, "total_steps": 40000, "loss": 0.0407, "lr": 0.09671437721488517, "epoch": 1.2032101238609436, "percentage": 61.56, "elapsed_time": "1 day, 2:06:33", "remaining_time": "16:18:06", "throughput": 331.87, "total_tokens": 31193536} {"current_steps": 24630, "total_steps": 40000, "loss": 0.0427, "lr": 0.09665931846843086, "epoch": 1.2034544255246378, "percentage": 61.58, "elapsed_time": "1 day, 2:06:37", "remaining_time": "16:17:37", "throughput": 331.93, "total_tokens": 31200800} {"current_steps": 24635, "total_steps": 40000, "loss": 0.0841, "lr": 0.0966042679477799, "epoch": 1.2036987271883322, "percentage": 61.59, "elapsed_time": "1 day, 2:06:40", "remaining_time": "16:17:08", "throughput": 331.99, "total_tokens": 31207488} {"current_steps": 24640, "total_steps": 40000, "loss": 0.0666, "lr": 0.09654922566142186, "epoch": 1.2039430288520265, "percentage": 61.6, "elapsed_time": "1 day, 2:06:43", "remaining_time": "16:16:39", "throughput": 332.05, "total_tokens": 31213856} {"current_steps": 24645, "total_steps": 40000, "loss": 0.075, "lr": 0.09649419161784498, "epoch": 1.2041873305157207, "percentage": 61.61, "elapsed_time": "1 day, 2:06:46", "remaining_time": "16:16:10", "throughput": 332.1, "total_tokens": 31219840} {"current_steps": 24650, "total_steps": 40000, "loss": 0.0429, "lr": 0.09643916582553606, "epoch": 1.204431632179415, "percentage": 61.62, "elapsed_time": "1 day, 2:06:49", "remaining_time": "16:15:41", "throughput": 332.17, "total_tokens": 31226880} {"current_steps": 24655, "total_steps": 40000, "loss": 0.0653, "lr": 0.09638414829298093, "epoch": 1.2046759338431094, "percentage": 61.64, "elapsed_time": "1 day, 2:06:52", "remaining_time": "16:15:12", "throughput": 332.23, "total_tokens": 31233728} {"current_steps": 24660, "total_steps": 40000, "loss": 0.0318, "lr": 0.09632913902866386, "epoch": 1.2049202355068038, "percentage": 61.65, "elapsed_time": "1 day, 2:06:55", "remaining_time": "16:14:43", "throughput": 332.29, "total_tokens": 31240128} {"current_steps": 24665, "total_steps": 40000, "loss": 0.0845, "lr": 0.096274138041068, "epoch": 1.2051645371704982, "percentage": 61.66, "elapsed_time": "1 day, 2:06:59", "remaining_time": "16:14:14", "throughput": 332.34, "total_tokens": 31246272} {"current_steps": 24670, "total_steps": 40000, "loss": 0.0653, "lr": 0.09621914533867527, "epoch": 1.2054088388341924, "percentage": 61.68, "elapsed_time": "1 day, 2:07:02", "remaining_time": "16:13:45", "throughput": 332.4, "total_tokens": 31252800} {"current_steps": 24675, "total_steps": 40000, "loss": 0.0787, "lr": 0.09616416092996616, "epoch": 1.2056531404978867, "percentage": 61.69, "elapsed_time": "1 day, 2:07:05", "remaining_time": "16:13:16", "throughput": 332.46, "total_tokens": 31259168} {"current_steps": 24680, "total_steps": 40000, "loss": 0.059, "lr": 0.09610918482342, "epoch": 1.2058974421615811, "percentage": 61.7, "elapsed_time": "1 day, 2:07:08", "remaining_time": "16:12:47", "throughput": 332.51, "total_tokens": 31265312} {"current_steps": 24685, "total_steps": 40000, "loss": 0.0585, "lr": 0.09605421702751478, "epoch": 1.2061417438252755, "percentage": 61.71, "elapsed_time": "1 day, 2:07:11", "remaining_time": "16:12:18", "throughput": 332.56, "total_tokens": 31270816} {"current_steps": 24690, "total_steps": 40000, "loss": 0.045, "lr": 0.09599925755072718, "epoch": 1.2063860454889697, "percentage": 61.72, "elapsed_time": "1 day, 2:07:14", "remaining_time": "16:11:49", "throughput": 332.61, "total_tokens": 31277184} {"current_steps": 24695, "total_steps": 40000, "loss": 0.0462, "lr": 0.09594430640153273, "epoch": 1.206630347152664, "percentage": 61.74, "elapsed_time": "1 day, 2:07:17", "remaining_time": "16:11:20", "throughput": 332.67, "total_tokens": 31283392} {"current_steps": 24700, "total_steps": 40000, "loss": 0.0907, "lr": 0.09588936358840547, "epoch": 1.2068746488163584, "percentage": 61.75, "elapsed_time": "1 day, 2:07:20", "remaining_time": "16:10:51", "throughput": 332.72, "total_tokens": 31289600} {"current_steps": 24705, "total_steps": 40000, "loss": 0.0526, "lr": 0.09583442911981836, "epoch": 1.2071189504800528, "percentage": 61.76, "elapsed_time": "1 day, 2:07:23", "remaining_time": "16:10:22", "throughput": 332.78, "total_tokens": 31296256} {"current_steps": 24710, "total_steps": 40000, "loss": 0.0528, "lr": 0.09577950300424302, "epoch": 1.2073632521437472, "percentage": 61.78, "elapsed_time": "1 day, 2:07:26", "remaining_time": "16:09:53", "throughput": 332.83, "total_tokens": 31301952} {"current_steps": 24715, "total_steps": 40000, "loss": 0.0509, "lr": 0.09572458525014967, "epoch": 1.2076075538074413, "percentage": 61.79, "elapsed_time": "1 day, 2:07:29", "remaining_time": "16:09:25", "throughput": 332.89, "total_tokens": 31308032} {"current_steps": 24720, "total_steps": 40000, "loss": 0.0944, "lr": 0.0956696758660073, "epoch": 1.2078518554711357, "percentage": 61.8, "elapsed_time": "1 day, 2:07:32", "remaining_time": "16:08:56", "throughput": 332.94, "total_tokens": 31314272} {"current_steps": 24725, "total_steps": 40000, "loss": 0.0653, "lr": 0.09561477486028373, "epoch": 1.20809615713483, "percentage": 61.81, "elapsed_time": "1 day, 2:07:35", "remaining_time": "16:08:27", "throughput": 333.0, "total_tokens": 31320576} {"current_steps": 24730, "total_steps": 40000, "loss": 0.0653, "lr": 0.09555988224144528, "epoch": 1.2083404587985245, "percentage": 61.82, "elapsed_time": "1 day, 2:07:38", "remaining_time": "16:07:58", "throughput": 333.06, "total_tokens": 31326816} {"current_steps": 24735, "total_steps": 40000, "loss": 0.0548, "lr": 0.09550499801795717, "epoch": 1.2085847604622186, "percentage": 61.84, "elapsed_time": "1 day, 2:07:41", "remaining_time": "16:07:29", "throughput": 333.11, "total_tokens": 31333056} {"current_steps": 24740, "total_steps": 40000, "loss": 0.0703, "lr": 0.09545012219828314, "epoch": 1.208829062125913, "percentage": 61.85, "elapsed_time": "1 day, 2:07:45", "remaining_time": "16:07:00", "throughput": 333.17, "total_tokens": 31339488} {"current_steps": 24745, "total_steps": 40000, "loss": 0.0615, "lr": 0.09539525479088577, "epoch": 1.2090733637896074, "percentage": 61.86, "elapsed_time": "1 day, 2:07:48", "remaining_time": "16:06:31", "throughput": 333.22, "total_tokens": 31345408} {"current_steps": 24750, "total_steps": 40000, "loss": 0.0978, "lr": 0.0953403958042264, "epoch": 1.2093176654533018, "percentage": 61.88, "elapsed_time": "1 day, 2:07:51", "remaining_time": "16:06:03", "throughput": 333.28, "total_tokens": 31351648} {"current_steps": 24755, "total_steps": 40000, "loss": 0.035, "lr": 0.09528554524676484, "epoch": 1.2095619671169962, "percentage": 61.89, "elapsed_time": "1 day, 2:07:54", "remaining_time": "16:05:34", "throughput": 333.33, "total_tokens": 31358144} {"current_steps": 24760, "total_steps": 40000, "loss": 0.083, "lr": 0.09523070312695978, "epoch": 1.2098062687806903, "percentage": 61.9, "elapsed_time": "1 day, 2:07:57", "remaining_time": "16:05:05", "throughput": 333.39, "total_tokens": 31364288} {"current_steps": 24765, "total_steps": 40000, "loss": 0.0759, "lr": 0.09517586945326863, "epoch": 1.2100505704443847, "percentage": 61.91, "elapsed_time": "1 day, 2:08:00", "remaining_time": "16:04:36", "throughput": 333.44, "total_tokens": 31370336} {"current_steps": 24770, "total_steps": 40000, "loss": 0.0631, "lr": 0.0951210442341473, "epoch": 1.210294872108079, "percentage": 61.92, "elapsed_time": "1 day, 2:08:03", "remaining_time": "16:04:07", "throughput": 333.49, "total_tokens": 31376320} {"current_steps": 24775, "total_steps": 40000, "loss": 0.0327, "lr": 0.09506622747805066, "epoch": 1.2105391737717734, "percentage": 61.94, "elapsed_time": "1 day, 2:08:06", "remaining_time": "16:03:38", "throughput": 333.55, "total_tokens": 31382240} {"current_steps": 24780, "total_steps": 40000, "loss": 0.0883, "lr": 0.09501141919343203, "epoch": 1.2107834754354676, "percentage": 61.95, "elapsed_time": "1 day, 2:08:09", "remaining_time": "16:03:10", "throughput": 333.6, "total_tokens": 31388160} {"current_steps": 24785, "total_steps": 40000, "loss": 0.0666, "lr": 0.09495661938874361, "epoch": 1.211027777099162, "percentage": 61.96, "elapsed_time": "1 day, 2:08:12", "remaining_time": "16:02:41", "throughput": 333.65, "total_tokens": 31394112} {"current_steps": 24790, "total_steps": 40000, "loss": 0.0712, "lr": 0.0949018280724362, "epoch": 1.2112720787628564, "percentage": 61.98, "elapsed_time": "1 day, 2:08:15", "remaining_time": "16:02:12", "throughput": 333.71, "total_tokens": 31400224} {"current_steps": 24795, "total_steps": 40000, "loss": 0.0608, "lr": 0.09484704525295934, "epoch": 1.2115163804265507, "percentage": 61.99, "elapsed_time": "1 day, 2:08:18", "remaining_time": "16:01:43", "throughput": 333.76, "total_tokens": 31406528} {"current_steps": 24800, "total_steps": 40000, "loss": 0.0691, "lr": 0.09479227093876112, "epoch": 1.2117606820902451, "percentage": 62.0, "elapsed_time": "1 day, 2:08:21", "remaining_time": "16:01:15", "throughput": 333.82, "total_tokens": 31412736} {"current_steps": 24800, "total_steps": 40000, "eval_loss": 0.0638032853603363, "epoch": 1.2117606820902451, "percentage": 62.0, "elapsed_time": "1 day, 2:19:02", "remaining_time": "16:07:47", "throughput": 331.56, "total_tokens": 31412736} {"current_steps": 24805, "total_steps": 40000, "loss": 0.057, "lr": 0.0947375051382886, "epoch": 1.2120049837539393, "percentage": 62.01, "elapsed_time": "1 day, 2:19:05", "remaining_time": "16:07:19", "throughput": 331.61, "total_tokens": 31419040} {"current_steps": 24810, "total_steps": 40000, "loss": 0.041, "lr": 0.09468274785998718, "epoch": 1.2122492854176337, "percentage": 62.02, "elapsed_time": "1 day, 2:19:09", "remaining_time": "16:06:50", "throughput": 331.67, "total_tokens": 31425376} {"current_steps": 24815, "total_steps": 40000, "loss": 0.0689, "lr": 0.09462799911230127, "epoch": 1.212493587081328, "percentage": 62.04, "elapsed_time": "1 day, 2:19:12", "remaining_time": "16:06:21", "throughput": 331.73, "total_tokens": 31431904} {"current_steps": 24820, "total_steps": 40000, "loss": 0.0504, "lr": 0.0945732589036737, "epoch": 1.2127378887450224, "percentage": 62.05, "elapsed_time": "1 day, 2:19:15", "remaining_time": "16:05:52", "throughput": 331.78, "total_tokens": 31438176} {"current_steps": 24825, "total_steps": 40000, "loss": 0.0569, "lr": 0.09451852724254614, "epoch": 1.2129821904087166, "percentage": 62.06, "elapsed_time": "1 day, 2:19:18", "remaining_time": "16:05:23", "throughput": 331.84, "total_tokens": 31444608} {"current_steps": 24830, "total_steps": 40000, "loss": 0.0529, "lr": 0.09446380413735894, "epoch": 1.213226492072411, "percentage": 62.08, "elapsed_time": "1 day, 2:19:21", "remaining_time": "16:04:54", "throughput": 331.9, "total_tokens": 31451104} {"current_steps": 24835, "total_steps": 40000, "loss": 0.0585, "lr": 0.09440908959655099, "epoch": 1.2134707937361053, "percentage": 62.09, "elapsed_time": "1 day, 2:19:24", "remaining_time": "16:04:26", "throughput": 331.95, "total_tokens": 31457440} {"current_steps": 24840, "total_steps": 40000, "loss": 0.0712, "lr": 0.09435438362856004, "epoch": 1.2137150953997997, "percentage": 62.1, "elapsed_time": "1 day, 2:19:27", "remaining_time": "16:03:57", "throughput": 332.01, "total_tokens": 31463872} {"current_steps": 24845, "total_steps": 40000, "loss": 0.0453, "lr": 0.0942996862418225, "epoch": 1.213959397063494, "percentage": 62.11, "elapsed_time": "1 day, 2:19:30", "remaining_time": "16:03:28", "throughput": 332.07, "total_tokens": 31470848} {"current_steps": 24850, "total_steps": 40000, "loss": 0.0253, "lr": 0.09424499744477322, "epoch": 1.2142036987271883, "percentage": 62.12, "elapsed_time": "1 day, 2:19:34", "remaining_time": "16:02:59", "throughput": 332.13, "total_tokens": 31477248} {"current_steps": 24855, "total_steps": 40000, "loss": 0.0622, "lr": 0.09419031724584608, "epoch": 1.2144480003908826, "percentage": 62.14, "elapsed_time": "1 day, 2:19:37", "remaining_time": "16:02:30", "throughput": 332.18, "total_tokens": 31483456} {"current_steps": 24860, "total_steps": 40000, "loss": 0.0452, "lr": 0.09413564565347331, "epoch": 1.214692302054577, "percentage": 62.15, "elapsed_time": "1 day, 2:19:40", "remaining_time": "16:02:02", "throughput": 332.24, "total_tokens": 31489440} {"current_steps": 24865, "total_steps": 40000, "loss": 0.0591, "lr": 0.094080982676086, "epoch": 1.2149366037182714, "percentage": 62.16, "elapsed_time": "1 day, 2:19:43", "remaining_time": "16:01:33", "throughput": 332.29, "total_tokens": 31495680} {"current_steps": 24870, "total_steps": 40000, "loss": 0.0674, "lr": 0.09402632832211395, "epoch": 1.2151809053819655, "percentage": 62.18, "elapsed_time": "1 day, 2:19:46", "remaining_time": "16:01:04", "throughput": 332.35, "total_tokens": 31501920} {"current_steps": 24875, "total_steps": 40000, "loss": 0.065, "lr": 0.09397168259998541, "epoch": 1.21542520704566, "percentage": 62.19, "elapsed_time": "1 day, 2:19:49", "remaining_time": "16:00:35", "throughput": 332.4, "total_tokens": 31508320} {"current_steps": 24880, "total_steps": 40000, "loss": 0.0462, "lr": 0.09391704551812759, "epoch": 1.2156695087093543, "percentage": 62.2, "elapsed_time": "1 day, 2:19:52", "remaining_time": "16:00:06", "throughput": 332.46, "total_tokens": 31514368} {"current_steps": 24885, "total_steps": 40000, "loss": 0.0677, "lr": 0.09386241708496605, "epoch": 1.2159138103730487, "percentage": 62.21, "elapsed_time": "1 day, 2:19:55", "remaining_time": "15:59:38", "throughput": 332.51, "total_tokens": 31520416} {"current_steps": 24890, "total_steps": 40000, "loss": 0.0505, "lr": 0.09380779730892527, "epoch": 1.216158112036743, "percentage": 62.22, "elapsed_time": "1 day, 2:19:58", "remaining_time": "15:59:09", "throughput": 332.56, "total_tokens": 31526560} {"current_steps": 24895, "total_steps": 40000, "loss": 0.058, "lr": 0.09375318619842836, "epoch": 1.2164024137004372, "percentage": 62.24, "elapsed_time": "1 day, 2:20:01", "remaining_time": "15:58:40", "throughput": 332.62, "total_tokens": 31533344} {"current_steps": 24900, "total_steps": 40000, "loss": 0.0509, "lr": 0.09369858376189696, "epoch": 1.2166467153641316, "percentage": 62.25, "elapsed_time": "1 day, 2:20:04", "remaining_time": "15:58:12", "throughput": 332.69, "total_tokens": 31540320} {"current_steps": 24905, "total_steps": 40000, "loss": 0.0636, "lr": 0.09364399000775143, "epoch": 1.216891017027826, "percentage": 62.26, "elapsed_time": "1 day, 2:20:08", "remaining_time": "15:57:43", "throughput": 332.74, "total_tokens": 31546880} {"current_steps": 24910, "total_steps": 40000, "loss": 0.0527, "lr": 0.09358940494441093, "epoch": 1.2171353186915204, "percentage": 62.28, "elapsed_time": "1 day, 2:20:11", "remaining_time": "15:57:14", "throughput": 332.8, "total_tokens": 31553248} {"current_steps": 24915, "total_steps": 40000, "loss": 0.0734, "lr": 0.09353482858029301, "epoch": 1.2173796203552145, "percentage": 62.29, "elapsed_time": "1 day, 2:20:14", "remaining_time": "15:56:46", "throughput": 332.85, "total_tokens": 31559136} {"current_steps": 24920, "total_steps": 40000, "loss": 0.0785, "lr": 0.09348026092381419, "epoch": 1.217623922018909, "percentage": 62.3, "elapsed_time": "1 day, 2:20:17", "remaining_time": "15:56:17", "throughput": 332.91, "total_tokens": 31565440} {"current_steps": 24925, "total_steps": 40000, "loss": 0.0559, "lr": 0.09342570198338931, "epoch": 1.2178682236826033, "percentage": 62.31, "elapsed_time": "1 day, 2:20:20", "remaining_time": "15:55:48", "throughput": 332.97, "total_tokens": 31572512} {"current_steps": 24930, "total_steps": 40000, "loss": 0.0459, "lr": 0.0933711517674322, "epoch": 1.2181125253462977, "percentage": 62.32, "elapsed_time": "1 day, 2:20:23", "remaining_time": "15:55:20", "throughput": 333.03, "total_tokens": 31579008} {"current_steps": 24935, "total_steps": 40000, "loss": 0.0432, "lr": 0.09331661028435513, "epoch": 1.218356827009992, "percentage": 62.34, "elapsed_time": "1 day, 2:20:26", "remaining_time": "15:54:51", "throughput": 333.09, "total_tokens": 31585376} {"current_steps": 24940, "total_steps": 40000, "loss": 0.0496, "lr": 0.09326207754256909, "epoch": 1.2186011286736862, "percentage": 62.35, "elapsed_time": "1 day, 2:20:29", "remaining_time": "15:54:22", "throughput": 333.14, "total_tokens": 31591840} {"current_steps": 24945, "total_steps": 40000, "loss": 0.0483, "lr": 0.09320755355048366, "epoch": 1.2188454303373806, "percentage": 62.36, "elapsed_time": "1 day, 2:20:32", "remaining_time": "15:53:54", "throughput": 333.2, "total_tokens": 31598368} {"current_steps": 24950, "total_steps": 40000, "loss": 0.0406, "lr": 0.09315303831650722, "epoch": 1.219089732001075, "percentage": 62.38, "elapsed_time": "1 day, 2:20:36", "remaining_time": "15:53:25", "throughput": 333.26, "total_tokens": 31604992} {"current_steps": 24955, "total_steps": 40000, "loss": 0.053, "lr": 0.09309853184904661, "epoch": 1.2193340336647693, "percentage": 62.39, "elapsed_time": "1 day, 2:20:39", "remaining_time": "15:52:57", "throughput": 333.31, "total_tokens": 31611232} {"current_steps": 24960, "total_steps": 40000, "loss": 0.0526, "lr": 0.09304403415650753, "epoch": 1.2195783353284635, "percentage": 62.4, "elapsed_time": "1 day, 2:20:42", "remaining_time": "15:52:28", "throughput": 333.37, "total_tokens": 31617664} {"current_steps": 24965, "total_steps": 40000, "loss": 0.0577, "lr": 0.09298954524729405, "epoch": 1.2198226369921579, "percentage": 62.41, "elapsed_time": "1 day, 2:20:45", "remaining_time": "15:51:59", "throughput": 333.42, "total_tokens": 31623744} {"current_steps": 24970, "total_steps": 40000, "loss": 0.0663, "lr": 0.09293506512980916, "epoch": 1.2200669386558523, "percentage": 62.42, "elapsed_time": "1 day, 2:20:48", "remaining_time": "15:51:31", "throughput": 333.48, "total_tokens": 31630272} {"current_steps": 24975, "total_steps": 40000, "loss": 0.042, "lr": 0.0928805938124544, "epoch": 1.2203112403195466, "percentage": 62.44, "elapsed_time": "1 day, 2:20:51", "remaining_time": "15:51:02", "throughput": 333.54, "total_tokens": 31636704} {"current_steps": 24980, "total_steps": 40000, "loss": 0.0674, "lr": 0.09282613130362982, "epoch": 1.220555541983241, "percentage": 62.45, "elapsed_time": "1 day, 2:20:54", "remaining_time": "15:50:34", "throughput": 333.59, "total_tokens": 31642944} {"current_steps": 24985, "total_steps": 40000, "loss": 0.0569, "lr": 0.09277167761173427, "epoch": 1.2207998436469352, "percentage": 62.46, "elapsed_time": "1 day, 2:20:57", "remaining_time": "15:50:05", "throughput": 333.65, "total_tokens": 31649184} {"current_steps": 24990, "total_steps": 40000, "loss": 0.0366, "lr": 0.0927172327451653, "epoch": 1.2210441453106295, "percentage": 62.48, "elapsed_time": "1 day, 2:21:00", "remaining_time": "15:49:37", "throughput": 333.71, "total_tokens": 31655584} {"current_steps": 24995, "total_steps": 40000, "loss": 0.0708, "lr": 0.09266279671231882, "epoch": 1.221288446974324, "percentage": 62.49, "elapsed_time": "1 day, 2:21:03", "remaining_time": "15:49:08", "throughput": 333.75, "total_tokens": 31661152} {"current_steps": 25000, "total_steps": 40000, "loss": 0.0561, "lr": 0.09260836952158967, "epoch": 1.2215327486380183, "percentage": 62.5, "elapsed_time": "1 day, 2:21:07", "remaining_time": "15:48:40", "throughput": 333.81, "total_tokens": 31668000} {"current_steps": 25000, "total_steps": 40000, "eval_loss": 0.06361822783946991, "epoch": 1.2215327486380183, "percentage": 62.5, "elapsed_time": "1 day, 2:31:47", "remaining_time": "15:55:04", "throughput": 331.58, "total_tokens": 31668000} {"current_steps": 25005, "total_steps": 40000, "loss": 0.0729, "lr": 0.09255395118137114, "epoch": 1.2217770503017125, "percentage": 62.51, "elapsed_time": "1 day, 2:31:51", "remaining_time": "15:54:36", "throughput": 331.63, "total_tokens": 31674080} {"current_steps": 25010, "total_steps": 40000, "loss": 0.0432, "lr": 0.09249954170005527, "epoch": 1.2220213519654068, "percentage": 62.52, "elapsed_time": "1 day, 2:31:54", "remaining_time": "15:54:07", "throughput": 331.68, "total_tokens": 31680192} {"current_steps": 25015, "total_steps": 40000, "loss": 0.0739, "lr": 0.0924451410860327, "epoch": 1.2222656536291012, "percentage": 62.54, "elapsed_time": "1 day, 2:31:57", "remaining_time": "15:53:38", "throughput": 331.73, "total_tokens": 31686336} {"current_steps": 25020, "total_steps": 40000, "loss": 0.0456, "lr": 0.09239074934769258, "epoch": 1.2225099552927956, "percentage": 62.55, "elapsed_time": "1 day, 2:32:00", "remaining_time": "15:53:10", "throughput": 331.8, "total_tokens": 31693216} {"current_steps": 25025, "total_steps": 40000, "loss": 0.0568, "lr": 0.09233636649342288, "epoch": 1.22275425695649, "percentage": 62.56, "elapsed_time": "1 day, 2:32:03", "remaining_time": "15:52:41", "throughput": 331.85, "total_tokens": 31699392} {"current_steps": 25030, "total_steps": 40000, "loss": 0.0547, "lr": 0.09228199253161017, "epoch": 1.2229985586201841, "percentage": 62.58, "elapsed_time": "1 day, 2:32:06", "remaining_time": "15:52:12", "throughput": 331.9, "total_tokens": 31705504} {"current_steps": 25035, "total_steps": 40000, "loss": 0.0513, "lr": 0.09222762747063949, "epoch": 1.2232428602838785, "percentage": 62.59, "elapsed_time": "1 day, 2:32:09", "remaining_time": "15:51:44", "throughput": 331.96, "total_tokens": 31711872} {"current_steps": 25040, "total_steps": 40000, "loss": 0.0472, "lr": 0.09217327131889473, "epoch": 1.223487161947573, "percentage": 62.6, "elapsed_time": "1 day, 2:32:13", "remaining_time": "15:51:15", "throughput": 332.02, "total_tokens": 31718976} {"current_steps": 25045, "total_steps": 40000, "loss": 0.0706, "lr": 0.09211892408475818, "epoch": 1.2237314636112673, "percentage": 62.61, "elapsed_time": "1 day, 2:32:16", "remaining_time": "15:50:47", "throughput": 332.08, "total_tokens": 31725280} {"current_steps": 25050, "total_steps": 40000, "loss": 0.0388, "lr": 0.09206458577661089, "epoch": 1.2239757652749614, "percentage": 62.62, "elapsed_time": "1 day, 2:32:19", "remaining_time": "15:50:18", "throughput": 332.13, "total_tokens": 31731520} {"current_steps": 25055, "total_steps": 40000, "loss": 0.0569, "lr": 0.09201025640283263, "epoch": 1.2242200669386558, "percentage": 62.64, "elapsed_time": "1 day, 2:32:22", "remaining_time": "15:49:49", "throughput": 332.19, "total_tokens": 31737920} {"current_steps": 25060, "total_steps": 40000, "loss": 0.0555, "lr": 0.09195593597180148, "epoch": 1.2244643686023502, "percentage": 62.65, "elapsed_time": "1 day, 2:32:25", "remaining_time": "15:49:21", "throughput": 332.24, "total_tokens": 31743808} {"current_steps": 25065, "total_steps": 40000, "loss": 0.0813, "lr": 0.09190162449189444, "epoch": 1.2247086702660446, "percentage": 62.66, "elapsed_time": "1 day, 2:32:28", "remaining_time": "15:48:52", "throughput": 332.29, "total_tokens": 31750048} {"current_steps": 25070, "total_steps": 40000, "loss": 0.078, "lr": 0.09184732197148705, "epoch": 1.224952971929739, "percentage": 62.68, "elapsed_time": "1 day, 2:32:31", "remaining_time": "15:48:24", "throughput": 332.35, "total_tokens": 31756384} {"current_steps": 25075, "total_steps": 40000, "loss": 0.0306, "lr": 0.09179302841895343, "epoch": 1.2251972735934331, "percentage": 62.69, "elapsed_time": "1 day, 2:32:34", "remaining_time": "15:47:55", "throughput": 332.4, "total_tokens": 31762496} {"current_steps": 25080, "total_steps": 40000, "loss": 0.0582, "lr": 0.09173874384266625, "epoch": 1.2254415752571275, "percentage": 62.7, "elapsed_time": "1 day, 2:32:37", "remaining_time": "15:47:26", "throughput": 332.45, "total_tokens": 31768416} {"current_steps": 25085, "total_steps": 40000, "loss": 0.0683, "lr": 0.09168446825099695, "epoch": 1.2256858769208219, "percentage": 62.71, "elapsed_time": "1 day, 2:32:40", "remaining_time": "15:46:58", "throughput": 332.51, "total_tokens": 31774816} {"current_steps": 25090, "total_steps": 40000, "loss": 0.063, "lr": 0.09163020165231545, "epoch": 1.2259301785845163, "percentage": 62.72, "elapsed_time": "1 day, 2:32:43", "remaining_time": "15:46:29", "throughput": 332.56, "total_tokens": 31780960} {"current_steps": 25095, "total_steps": 40000, "loss": 0.0386, "lr": 0.09157594405499044, "epoch": 1.2261744802482104, "percentage": 62.74, "elapsed_time": "1 day, 2:32:46", "remaining_time": "15:46:01", "throughput": 332.62, "total_tokens": 31787104} {"current_steps": 25100, "total_steps": 40000, "loss": 0.0723, "lr": 0.09152169546738899, "epoch": 1.2264187819119048, "percentage": 62.75, "elapsed_time": "1 day, 2:32:49", "remaining_time": "15:45:32", "throughput": 332.67, "total_tokens": 31793280} {"current_steps": 25105, "total_steps": 40000, "loss": 0.0385, "lr": 0.09146745589787698, "epoch": 1.2266630835755992, "percentage": 62.76, "elapsed_time": "1 day, 2:32:52", "remaining_time": "15:45:04", "throughput": 332.73, "total_tokens": 31799584} {"current_steps": 25110, "total_steps": 40000, "loss": 0.0247, "lr": 0.09141322535481891, "epoch": 1.2269073852392935, "percentage": 62.78, "elapsed_time": "1 day, 2:32:55", "remaining_time": "15:44:35", "throughput": 332.78, "total_tokens": 31806240} {"current_steps": 25115, "total_steps": 40000, "loss": 0.0575, "lr": 0.0913590038465777, "epoch": 1.227151686902988, "percentage": 62.79, "elapsed_time": "1 day, 2:32:59", "remaining_time": "15:44:07", "throughput": 332.84, "total_tokens": 31812640} {"current_steps": 25120, "total_steps": 40000, "loss": 0.0402, "lr": 0.09130479138151505, "epoch": 1.227395988566682, "percentage": 62.8, "elapsed_time": "1 day, 2:33:02", "remaining_time": "15:43:38", "throughput": 332.9, "total_tokens": 31818976} {"current_steps": 25125, "total_steps": 40000, "loss": 0.0751, "lr": 0.09125058796799114, "epoch": 1.2276402902303765, "percentage": 62.81, "elapsed_time": "1 day, 2:33:05", "remaining_time": "15:43:10", "throughput": 332.95, "total_tokens": 31824736} {"current_steps": 25130, "total_steps": 40000, "loss": 0.0439, "lr": 0.09119639361436485, "epoch": 1.2278845918940708, "percentage": 62.82, "elapsed_time": "1 day, 2:33:08", "remaining_time": "15:42:41", "throughput": 333.0, "total_tokens": 31831232} {"current_steps": 25135, "total_steps": 40000, "loss": 0.0706, "lr": 0.09114220832899368, "epoch": 1.2281288935577652, "percentage": 62.84, "elapsed_time": "1 day, 2:33:11", "remaining_time": "15:42:13", "throughput": 333.06, "total_tokens": 31837568} {"current_steps": 25140, "total_steps": 40000, "loss": 0.051, "lr": 0.0910880321202336, "epoch": 1.2283731952214594, "percentage": 62.85, "elapsed_time": "1 day, 2:33:14", "remaining_time": "15:41:44", "throughput": 333.12, "total_tokens": 31843968} {"current_steps": 25145, "total_steps": 40000, "loss": 0.07, "lr": 0.09103386499643933, "epoch": 1.2286174968851538, "percentage": 62.86, "elapsed_time": "1 day, 2:33:17", "remaining_time": "15:41:16", "throughput": 333.17, "total_tokens": 31850016} {"current_steps": 25150, "total_steps": 40000, "loss": 0.0572, "lr": 0.09097970696596407, "epoch": 1.2288617985488481, "percentage": 62.88, "elapsed_time": "1 day, 2:33:20", "remaining_time": "15:40:48", "throughput": 333.23, "total_tokens": 31856640} {"current_steps": 25155, "total_steps": 40000, "loss": 0.0481, "lr": 0.09092555803715971, "epoch": 1.2291061002125425, "percentage": 62.89, "elapsed_time": "1 day, 2:33:23", "remaining_time": "15:40:19", "throughput": 333.28, "total_tokens": 31862848} {"current_steps": 25160, "total_steps": 40000, "loss": 0.0486, "lr": 0.0908714182183767, "epoch": 1.229350401876237, "percentage": 62.9, "elapsed_time": "1 day, 2:33:26", "remaining_time": "15:39:51", "throughput": 333.34, "total_tokens": 31869152} {"current_steps": 25165, "total_steps": 40000, "loss": 0.0573, "lr": 0.090817287517964, "epoch": 1.229594703539931, "percentage": 62.91, "elapsed_time": "1 day, 2:33:29", "remaining_time": "15:39:22", "throughput": 333.39, "total_tokens": 31875296} {"current_steps": 25170, "total_steps": 40000, "loss": 0.057, "lr": 0.09076316594426931, "epoch": 1.2298390052036254, "percentage": 62.92, "elapsed_time": "1 day, 2:33:33", "remaining_time": "15:38:54", "throughput": 333.45, "total_tokens": 31882336} {"current_steps": 25175, "total_steps": 40000, "loss": 0.0434, "lr": 0.09070905350563888, "epoch": 1.2300833068673198, "percentage": 62.94, "elapsed_time": "1 day, 2:33:36", "remaining_time": "15:38:26", "throughput": 333.51, "total_tokens": 31889184} {"current_steps": 25180, "total_steps": 40000, "loss": 0.0592, "lr": 0.09065495021041745, "epoch": 1.230327608531014, "percentage": 62.95, "elapsed_time": "1 day, 2:33:39", "remaining_time": "15:37:57", "throughput": 333.57, "total_tokens": 31895456} {"current_steps": 25185, "total_steps": 40000, "loss": 0.0438, "lr": 0.09060085606694851, "epoch": 1.2305719101947084, "percentage": 62.96, "elapsed_time": "1 day, 2:33:42", "remaining_time": "15:37:29", "throughput": 333.62, "total_tokens": 31901280} {"current_steps": 25190, "total_steps": 40000, "loss": 0.086, "lr": 0.09054677108357405, "epoch": 1.2308162118584027, "percentage": 62.98, "elapsed_time": "1 day, 2:33:45", "remaining_time": "15:37:01", "throughput": 333.67, "total_tokens": 31907136} {"current_steps": 25195, "total_steps": 40000, "loss": 0.0532, "lr": 0.09049269526863457, "epoch": 1.231060513522097, "percentage": 62.99, "elapsed_time": "1 day, 2:33:48", "remaining_time": "15:36:32", "throughput": 333.73, "total_tokens": 31913824} {"current_steps": 25200, "total_steps": 40000, "loss": 0.0488, "lr": 0.09043862863046935, "epoch": 1.2313048151857915, "percentage": 63.0, "elapsed_time": "1 day, 2:33:51", "remaining_time": "15:36:04", "throughput": 333.78, "total_tokens": 31919712} {"current_steps": 25200, "total_steps": 40000, "eval_loss": 0.06320296227931976, "epoch": 1.2313048151857915, "percentage": 63.0, "elapsed_time": "1 day, 2:44:30", "remaining_time": "15:42:20", "throughput": 331.56, "total_tokens": 31919712} {"current_steps": 25205, "total_steps": 40000, "loss": 0.0703, "lr": 0.09038457117741602, "epoch": 1.2315491168494859, "percentage": 63.01, "elapsed_time": "1 day, 2:44:34", "remaining_time": "15:41:51", "throughput": 331.62, "total_tokens": 31926304} {"current_steps": 25210, "total_steps": 40000, "loss": 0.0773, "lr": 0.09033052291781099, "epoch": 1.23179341851318, "percentage": 63.02, "elapsed_time": "1 day, 2:44:37", "remaining_time": "15:41:23", "throughput": 331.67, "total_tokens": 31932448} {"current_steps": 25215, "total_steps": 40000, "loss": 0.0546, "lr": 0.09027648385998926, "epoch": 1.2320377201768744, "percentage": 63.04, "elapsed_time": "1 day, 2:44:40", "remaining_time": "15:40:55", "throughput": 331.73, "total_tokens": 31938816} {"current_steps": 25220, "total_steps": 40000, "loss": 0.0474, "lr": 0.09022245401228417, "epoch": 1.2322820218405688, "percentage": 63.05, "elapsed_time": "1 day, 2:44:43", "remaining_time": "15:40:26", "throughput": 331.78, "total_tokens": 31944992} {"current_steps": 25225, "total_steps": 40000, "loss": 0.0481, "lr": 0.09016843338302792, "epoch": 1.232526323504263, "percentage": 63.06, "elapsed_time": "1 day, 2:44:46", "remaining_time": "15:39:58", "throughput": 331.83, "total_tokens": 31951072} {"current_steps": 25230, "total_steps": 40000, "loss": 0.0432, "lr": 0.09011442198055115, "epoch": 1.2327706251679573, "percentage": 63.08, "elapsed_time": "1 day, 2:44:50", "remaining_time": "15:39:29", "throughput": 331.88, "total_tokens": 31957152} {"current_steps": 25235, "total_steps": 40000, "loss": 0.0537, "lr": 0.09006041981318305, "epoch": 1.2330149268316517, "percentage": 63.09, "elapsed_time": "1 day, 2:44:53", "remaining_time": "15:39:01", "throughput": 331.94, "total_tokens": 31963360} {"current_steps": 25240, "total_steps": 40000, "loss": 0.0661, "lr": 0.09000642688925149, "epoch": 1.233259228495346, "percentage": 63.1, "elapsed_time": "1 day, 2:44:56", "remaining_time": "15:38:32", "throughput": 332.0, "total_tokens": 31970016} {"current_steps": 25245, "total_steps": 40000, "loss": 0.0595, "lr": 0.0899524432170828, "epoch": 1.2335035301590405, "percentage": 63.11, "elapsed_time": "1 day, 2:44:59", "remaining_time": "15:38:04", "throughput": 332.05, "total_tokens": 31976160} {"current_steps": 25250, "total_steps": 40000, "loss": 0.0746, "lr": 0.08989846880500196, "epoch": 1.2337478318227346, "percentage": 63.12, "elapsed_time": "1 day, 2:45:02", "remaining_time": "15:37:35", "throughput": 332.11, "total_tokens": 31983008} {"current_steps": 25255, "total_steps": 40000, "loss": 0.0791, "lr": 0.08984450366133256, "epoch": 1.233992133486429, "percentage": 63.14, "elapsed_time": "1 day, 2:45:05", "remaining_time": "15:37:07", "throughput": 332.16, "total_tokens": 31989280} {"current_steps": 25260, "total_steps": 40000, "loss": 0.0757, "lr": 0.08979054779439664, "epoch": 1.2342364351501234, "percentage": 63.15, "elapsed_time": "1 day, 2:45:08", "remaining_time": "15:36:39", "throughput": 332.22, "total_tokens": 31995776} {"current_steps": 25265, "total_steps": 40000, "loss": 0.0586, "lr": 0.08973660121251485, "epoch": 1.2344807368138178, "percentage": 63.16, "elapsed_time": "1 day, 2:45:11", "remaining_time": "15:36:10", "throughput": 332.28, "total_tokens": 32002112} {"current_steps": 25270, "total_steps": 40000, "loss": 0.0656, "lr": 0.08968266392400655, "epoch": 1.234725038477512, "percentage": 63.18, "elapsed_time": "1 day, 2:45:14", "remaining_time": "15:35:42", "throughput": 332.33, "total_tokens": 32008384} {"current_steps": 25275, "total_steps": 40000, "loss": 0.0586, "lr": 0.0896287359371894, "epoch": 1.2349693401412063, "percentage": 63.19, "elapsed_time": "1 day, 2:45:17", "remaining_time": "15:35:13", "throughput": 332.38, "total_tokens": 32014400} {"current_steps": 25280, "total_steps": 40000, "loss": 0.0556, "lr": 0.08957481726037989, "epoch": 1.2352136418049007, "percentage": 63.2, "elapsed_time": "1 day, 2:45:20", "remaining_time": "15:34:45", "throughput": 332.44, "total_tokens": 32020448} {"current_steps": 25285, "total_steps": 40000, "loss": 0.0458, "lr": 0.08952090790189286, "epoch": 1.235457943468595, "percentage": 63.21, "elapsed_time": "1 day, 2:45:24", "remaining_time": "15:34:17", "throughput": 332.49, "total_tokens": 32027008} {"current_steps": 25290, "total_steps": 40000, "loss": 0.0883, "lr": 0.08946700787004187, "epoch": 1.2357022451322894, "percentage": 63.22, "elapsed_time": "1 day, 2:45:26", "remaining_time": "15:33:48", "throughput": 332.54, "total_tokens": 32032800} {"current_steps": 25295, "total_steps": 40000, "loss": 0.0497, "lr": 0.08941311717313899, "epoch": 1.2359465467959836, "percentage": 63.24, "elapsed_time": "1 day, 2:45:30", "remaining_time": "15:33:20", "throughput": 332.6, "total_tokens": 32039200} {"current_steps": 25300, "total_steps": 40000, "loss": 0.0776, "lr": 0.08935923581949483, "epoch": 1.236190848459678, "percentage": 63.25, "elapsed_time": "1 day, 2:45:33", "remaining_time": "15:32:52", "throughput": 332.66, "total_tokens": 32045824} {"current_steps": 25305, "total_steps": 40000, "loss": 0.046, "lr": 0.0893053638174185, "epoch": 1.2364351501233724, "percentage": 63.26, "elapsed_time": "1 day, 2:45:36", "remaining_time": "15:32:23", "throughput": 332.71, "total_tokens": 32052064} {"current_steps": 25310, "total_steps": 40000, "loss": 0.0503, "lr": 0.0892515011752179, "epoch": 1.2366794517870667, "percentage": 63.28, "elapsed_time": "1 day, 2:45:39", "remaining_time": "15:31:55", "throughput": 332.77, "total_tokens": 32058528} {"current_steps": 25315, "total_steps": 40000, "loss": 0.0691, "lr": 0.08919764790119918, "epoch": 1.2369237534507609, "percentage": 63.29, "elapsed_time": "1 day, 2:45:42", "remaining_time": "15:31:27", "throughput": 332.82, "total_tokens": 32064576} {"current_steps": 25320, "total_steps": 40000, "loss": 0.034, "lr": 0.08914380400366727, "epoch": 1.2371680551144553, "percentage": 63.3, "elapsed_time": "1 day, 2:45:45", "remaining_time": "15:30:59", "throughput": 332.87, "total_tokens": 32070592} {"current_steps": 25325, "total_steps": 40000, "loss": 0.0463, "lr": 0.08908996949092551, "epoch": 1.2374123567781496, "percentage": 63.31, "elapsed_time": "1 day, 2:45:48", "remaining_time": "15:30:30", "throughput": 332.93, "total_tokens": 32076960} {"current_steps": 25330, "total_steps": 40000, "loss": 0.081, "lr": 0.08903614437127592, "epoch": 1.237656658441844, "percentage": 63.32, "elapsed_time": "1 day, 2:45:51", "remaining_time": "15:30:02", "throughput": 332.98, "total_tokens": 32083168} {"current_steps": 25335, "total_steps": 40000, "loss": 0.0551, "lr": 0.088982328653019, "epoch": 1.2379009601055384, "percentage": 63.34, "elapsed_time": "1 day, 2:45:54", "remaining_time": "15:29:34", "throughput": 333.04, "total_tokens": 32089728} {"current_steps": 25340, "total_steps": 40000, "loss": 0.0808, "lr": 0.0889285223444538, "epoch": 1.2381452617692326, "percentage": 63.35, "elapsed_time": "1 day, 2:45:57", "remaining_time": "15:29:06", "throughput": 333.09, "total_tokens": 32095936} {"current_steps": 25345, "total_steps": 40000, "loss": 0.069, "lr": 0.08887472545387787, "epoch": 1.238389563432927, "percentage": 63.36, "elapsed_time": "1 day, 2:46:00", "remaining_time": "15:28:37", "throughput": 333.15, "total_tokens": 32102336} {"current_steps": 25350, "total_steps": 40000, "loss": 0.0391, "lr": 0.08882093798958751, "epoch": 1.2386338650966213, "percentage": 63.38, "elapsed_time": "1 day, 2:46:03", "remaining_time": "15:28:09", "throughput": 333.2, "total_tokens": 32108672} {"current_steps": 25355, "total_steps": 40000, "loss": 0.0704, "lr": 0.08876715995987726, "epoch": 1.2388781667603157, "percentage": 63.39, "elapsed_time": "1 day, 2:46:07", "remaining_time": "15:27:41", "throughput": 333.26, "total_tokens": 32115072} {"current_steps": 25360, "total_steps": 40000, "loss": 0.0727, "lr": 0.08871339137304052, "epoch": 1.2391224684240099, "percentage": 63.4, "elapsed_time": "1 day, 2:46:10", "remaining_time": "15:27:13", "throughput": 333.32, "total_tokens": 32121728} {"current_steps": 25365, "total_steps": 40000, "loss": 0.0504, "lr": 0.0886596322373689, "epoch": 1.2393667700877042, "percentage": 63.41, "elapsed_time": "1 day, 2:46:13", "remaining_time": "15:26:45", "throughput": 333.38, "total_tokens": 32128576} {"current_steps": 25370, "total_steps": 40000, "loss": 0.0475, "lr": 0.08860588256115293, "epoch": 1.2396110717513986, "percentage": 63.42, "elapsed_time": "1 day, 2:46:16", "remaining_time": "15:26:16", "throughput": 333.44, "total_tokens": 32135296} {"current_steps": 25375, "total_steps": 40000, "loss": 0.055, "lr": 0.0885521423526814, "epoch": 1.239855373415093, "percentage": 63.44, "elapsed_time": "1 day, 2:46:19", "remaining_time": "15:25:48", "throughput": 333.49, "total_tokens": 32141152} {"current_steps": 25380, "total_steps": 40000, "loss": 0.0647, "lr": 0.08849841162024165, "epoch": 1.2400996750787874, "percentage": 63.45, "elapsed_time": "1 day, 2:46:22", "remaining_time": "15:25:20", "throughput": 333.54, "total_tokens": 32147104} {"current_steps": 25385, "total_steps": 40000, "loss": 0.1029, "lr": 0.08844469037211973, "epoch": 1.2403439767424815, "percentage": 63.46, "elapsed_time": "1 day, 2:46:25", "remaining_time": "15:24:52", "throughput": 333.59, "total_tokens": 32153568} {"current_steps": 25390, "total_steps": 40000, "loss": 0.0616, "lr": 0.08839097861660014, "epoch": 1.240588278406176, "percentage": 63.48, "elapsed_time": "1 day, 2:46:28", "remaining_time": "15:24:24", "throughput": 333.65, "total_tokens": 32160000} {"current_steps": 25395, "total_steps": 40000, "loss": 0.0551, "lr": 0.08833727636196585, "epoch": 1.2408325800698703, "percentage": 63.49, "elapsed_time": "1 day, 2:46:31", "remaining_time": "15:23:56", "throughput": 333.7, "total_tokens": 32166144} {"current_steps": 25400, "total_steps": 40000, "loss": 0.0365, "lr": 0.08828358361649848, "epoch": 1.2410768817335647, "percentage": 63.5, "elapsed_time": "1 day, 2:46:34", "remaining_time": "15:23:28", "throughput": 333.75, "total_tokens": 32172256} {"current_steps": 25400, "total_steps": 40000, "eval_loss": 0.06324383616447449, "epoch": 1.2410768817335647, "percentage": 63.5, "elapsed_time": "1 day, 2:57:15", "remaining_time": "15:29:36", "throughput": 331.55, "total_tokens": 32172256} {"current_steps": 25405, "total_steps": 40000, "loss": 0.055, "lr": 0.08822990038847807, "epoch": 1.2413211833972588, "percentage": 63.51, "elapsed_time": "1 day, 2:57:20", "remaining_time": "15:29:08", "throughput": 331.6, "total_tokens": 32178304} {"current_steps": 25410, "total_steps": 40000, "loss": 0.0595, "lr": 0.08817622668618325, "epoch": 1.2415654850609532, "percentage": 63.52, "elapsed_time": "1 day, 2:57:23", "remaining_time": "15:28:40", "throughput": 331.65, "total_tokens": 32183968} {"current_steps": 25415, "total_steps": 40000, "loss": 0.0725, "lr": 0.08812256251789125, "epoch": 1.2418097867246476, "percentage": 63.54, "elapsed_time": "1 day, 2:57:26", "remaining_time": "15:28:12", "throughput": 331.7, "total_tokens": 32190400} {"current_steps": 25420, "total_steps": 40000, "loss": 0.0596, "lr": 0.08806890789187766, "epoch": 1.242054088388342, "percentage": 63.55, "elapsed_time": "1 day, 2:57:29", "remaining_time": "15:27:43", "throughput": 331.75, "total_tokens": 32196512} {"current_steps": 25425, "total_steps": 40000, "loss": 0.08, "lr": 0.08801526281641672, "epoch": 1.2422983900520363, "percentage": 63.56, "elapsed_time": "1 day, 2:57:32", "remaining_time": "15:27:15", "throughput": 331.81, "total_tokens": 32202528} {"current_steps": 25430, "total_steps": 40000, "loss": 0.0732, "lr": 0.0879616272997813, "epoch": 1.2425426917157305, "percentage": 63.58, "elapsed_time": "1 day, 2:57:35", "remaining_time": "15:26:47", "throughput": 331.85, "total_tokens": 32208256} {"current_steps": 25435, "total_steps": 40000, "loss": 0.0528, "lr": 0.08790800135024247, "epoch": 1.2427869933794249, "percentage": 63.59, "elapsed_time": "1 day, 2:57:38", "remaining_time": "15:26:19", "throughput": 331.91, "total_tokens": 32214240} {"current_steps": 25440, "total_steps": 40000, "loss": 0.0548, "lr": 0.08785438497607023, "epoch": 1.2430312950431193, "percentage": 63.6, "elapsed_time": "1 day, 2:57:41", "remaining_time": "15:25:50", "throughput": 331.96, "total_tokens": 32220064} {"current_steps": 25445, "total_steps": 40000, "loss": 0.0382, "lr": 0.08780077818553277, "epoch": 1.2432755967068136, "percentage": 63.61, "elapsed_time": "1 day, 2:57:44", "remaining_time": "15:25:22", "throughput": 332.01, "total_tokens": 32226048} {"current_steps": 25450, "total_steps": 40000, "loss": 0.0467, "lr": 0.0877471809868969, "epoch": 1.2435198983705078, "percentage": 63.62, "elapsed_time": "1 day, 2:57:47", "remaining_time": "15:24:54", "throughput": 332.06, "total_tokens": 32232032} {"current_steps": 25455, "total_steps": 40000, "loss": 0.0402, "lr": 0.08769359338842811, "epoch": 1.2437642000342022, "percentage": 63.64, "elapsed_time": "1 day, 2:57:50", "remaining_time": "15:24:26", "throughput": 332.12, "total_tokens": 32239008} {"current_steps": 25460, "total_steps": 40000, "loss": 0.0876, "lr": 0.08764001539839016, "epoch": 1.2440085016978966, "percentage": 63.65, "elapsed_time": "1 day, 2:57:53", "remaining_time": "15:23:57", "throughput": 332.17, "total_tokens": 32245248} {"current_steps": 25465, "total_steps": 40000, "loss": 0.0528, "lr": 0.08758644702504548, "epoch": 1.244252803361591, "percentage": 63.66, "elapsed_time": "1 day, 2:57:56", "remaining_time": "15:23:29", "throughput": 332.23, "total_tokens": 32251616} {"current_steps": 25470, "total_steps": 40000, "loss": 0.0666, "lr": 0.0875328882766551, "epoch": 1.2444971050252853, "percentage": 63.68, "elapsed_time": "1 day, 2:57:59", "remaining_time": "15:23:01", "throughput": 332.28, "total_tokens": 32258080} {"current_steps": 25475, "total_steps": 40000, "loss": 0.0359, "lr": 0.08747933916147828, "epoch": 1.2447414066889795, "percentage": 63.69, "elapsed_time": "1 day, 2:58:03", "remaining_time": "15:22:33", "throughput": 332.34, "total_tokens": 32264672} {"current_steps": 25480, "total_steps": 40000, "loss": 0.0618, "lr": 0.0874257996877731, "epoch": 1.2449857083526739, "percentage": 63.7, "elapsed_time": "1 day, 2:58:06", "remaining_time": "15:22:05", "throughput": 332.4, "total_tokens": 32271456} {"current_steps": 25485, "total_steps": 40000, "loss": 0.0544, "lr": 0.08737226986379593, "epoch": 1.2452300100163682, "percentage": 63.71, "elapsed_time": "1 day, 2:58:09", "remaining_time": "15:21:37", "throughput": 332.45, "total_tokens": 32277728} {"current_steps": 25490, "total_steps": 40000, "loss": 0.0597, "lr": 0.08731874969780173, "epoch": 1.2454743116800626, "percentage": 63.73, "elapsed_time": "1 day, 2:58:12", "remaining_time": "15:21:09", "throughput": 332.51, "total_tokens": 32283904} {"current_steps": 25495, "total_steps": 40000, "loss": 0.0704, "lr": 0.08726523919804412, "epoch": 1.2457186133437568, "percentage": 63.74, "elapsed_time": "1 day, 2:58:15", "remaining_time": "15:20:41", "throughput": 332.56, "total_tokens": 32290496} {"current_steps": 25500, "total_steps": 40000, "loss": 0.0469, "lr": 0.08721173837277492, "epoch": 1.2459629150074512, "percentage": 63.75, "elapsed_time": "1 day, 2:58:18", "remaining_time": "15:20:12", "throughput": 332.62, "total_tokens": 32297152} {"current_steps": 25505, "total_steps": 40000, "loss": 0.062, "lr": 0.08715824723024479, "epoch": 1.2462072166711455, "percentage": 63.76, "elapsed_time": "1 day, 2:58:21", "remaining_time": "15:19:44", "throughput": 332.68, "total_tokens": 32303776} {"current_steps": 25510, "total_steps": 40000, "loss": 0.0358, "lr": 0.08710476577870258, "epoch": 1.24645151833484, "percentage": 63.78, "elapsed_time": "1 day, 2:58:24", "remaining_time": "15:19:16", "throughput": 332.74, "total_tokens": 32310464} {"current_steps": 25515, "total_steps": 40000, "loss": 0.0578, "lr": 0.08705129402639587, "epoch": 1.2466958199985343, "percentage": 63.79, "elapsed_time": "1 day, 2:58:27", "remaining_time": "15:18:48", "throughput": 332.79, "total_tokens": 32316736} {"current_steps": 25520, "total_steps": 40000, "loss": 0.0599, "lr": 0.08699783198157078, "epoch": 1.2469401216622285, "percentage": 63.8, "elapsed_time": "1 day, 2:58:31", "remaining_time": "15:18:20", "throughput": 332.84, "total_tokens": 32322752} {"current_steps": 25525, "total_steps": 40000, "loss": 0.0506, "lr": 0.08694437965247163, "epoch": 1.2471844233259228, "percentage": 63.81, "elapsed_time": "1 day, 2:58:34", "remaining_time": "15:17:52", "throughput": 332.9, "total_tokens": 32329504} {"current_steps": 25530, "total_steps": 40000, "loss": 0.0527, "lr": 0.08689093704734165, "epoch": 1.2474287249896172, "percentage": 63.82, "elapsed_time": "1 day, 2:58:37", "remaining_time": "15:17:24", "throughput": 332.96, "total_tokens": 32336032} {"current_steps": 25535, "total_steps": 40000, "loss": 0.0399, "lr": 0.08683750417442222, "epoch": 1.2476730266533116, "percentage": 63.84, "elapsed_time": "1 day, 2:58:40", "remaining_time": "15:16:56", "throughput": 333.01, "total_tokens": 32342496} {"current_steps": 25540, "total_steps": 40000, "loss": 0.0732, "lr": 0.08678408104195334, "epoch": 1.2479173283170057, "percentage": 63.85, "elapsed_time": "1 day, 2:58:43", "remaining_time": "15:16:28", "throughput": 333.07, "total_tokens": 32348800} {"current_steps": 25545, "total_steps": 40000, "loss": 0.0531, "lr": 0.08673066765817365, "epoch": 1.2481616299807001, "percentage": 63.86, "elapsed_time": "1 day, 2:58:46", "remaining_time": "15:16:00", "throughput": 333.12, "total_tokens": 32355136} {"current_steps": 25550, "total_steps": 40000, "loss": 0.0404, "lr": 0.08667726403132005, "epoch": 1.2484059316443945, "percentage": 63.88, "elapsed_time": "1 day, 2:58:49", "remaining_time": "15:15:32", "throughput": 333.17, "total_tokens": 32361184} {"current_steps": 25555, "total_steps": 40000, "loss": 0.0601, "lr": 0.0866238701696281, "epoch": 1.2486502333080889, "percentage": 63.89, "elapsed_time": "1 day, 2:58:52", "remaining_time": "15:15:04", "throughput": 333.23, "total_tokens": 32367520} {"current_steps": 25560, "total_steps": 40000, "loss": 0.0297, "lr": 0.08657048608133185, "epoch": 1.2488945349717833, "percentage": 63.9, "elapsed_time": "1 day, 2:58:55", "remaining_time": "15:14:36", "throughput": 333.28, "total_tokens": 32373504} {"current_steps": 25565, "total_steps": 40000, "loss": 0.049, "lr": 0.08651711177466369, "epoch": 1.2491388366354774, "percentage": 63.91, "elapsed_time": "1 day, 2:58:58", "remaining_time": "15:14:08", "throughput": 333.34, "total_tokens": 32380256} {"current_steps": 25570, "total_steps": 40000, "loss": 0.0549, "lr": 0.08646374725785466, "epoch": 1.2493831382991718, "percentage": 63.92, "elapsed_time": "1 day, 2:59:02", "remaining_time": "15:13:40", "throughput": 333.4, "total_tokens": 32387008} {"current_steps": 25575, "total_steps": 40000, "loss": 0.074, "lr": 0.08641039253913434, "epoch": 1.2496274399628662, "percentage": 63.94, "elapsed_time": "1 day, 2:59:05", "remaining_time": "15:13:12", "throughput": 333.46, "total_tokens": 32393632} {"current_steps": 25580, "total_steps": 40000, "loss": 0.0542, "lr": 0.08635704762673052, "epoch": 1.2498717416265606, "percentage": 63.95, "elapsed_time": "1 day, 2:59:08", "remaining_time": "15:12:44", "throughput": 333.51, "total_tokens": 32399680} {"current_steps": 25585, "total_steps": 40000, "loss": 0.0592, "lr": 0.08630371252886981, "epoch": 1.2501160432902547, "percentage": 63.96, "elapsed_time": "1 day, 2:59:11", "remaining_time": "15:12:16", "throughput": 333.56, "total_tokens": 32406112} {"current_steps": 25590, "total_steps": 40000, "loss": 0.0728, "lr": 0.08625038725377704, "epoch": 1.250360344953949, "percentage": 63.98, "elapsed_time": "1 day, 2:59:14", "remaining_time": "15:11:48", "throughput": 333.61, "total_tokens": 32411808} {"current_steps": 25595, "total_steps": 40000, "loss": 0.0475, "lr": 0.08619707180967566, "epoch": 1.2506046466176435, "percentage": 63.99, "elapsed_time": "1 day, 2:59:17", "remaining_time": "15:11:20", "throughput": 333.67, "total_tokens": 32418336} {"current_steps": 25600, "total_steps": 40000, "loss": 0.0536, "lr": 0.08614376620478768, "epoch": 1.2508489482813379, "percentage": 64.0, "elapsed_time": "1 day, 2:59:20", "remaining_time": "15:10:52", "throughput": 333.72, "total_tokens": 32424512} {"current_steps": 25600, "total_steps": 40000, "eval_loss": 0.06467566639184952, "epoch": 1.2508489482813379, "percentage": 64.0, "elapsed_time": "1 day, 3:10:00", "remaining_time": "15:16:52", "throughput": 331.54, "total_tokens": 32424512} {"current_steps": 25605, "total_steps": 40000, "loss": 0.0719, "lr": 0.08609047044733344, "epoch": 1.2510932499450322, "percentage": 64.01, "elapsed_time": "1 day, 3:10:05", "remaining_time": "15:16:25", "throughput": 331.59, "total_tokens": 32431168} {"current_steps": 25610, "total_steps": 40000, "loss": 0.0652, "lr": 0.08603718454553168, "epoch": 1.2513375516087264, "percentage": 64.03, "elapsed_time": "1 day, 3:10:08", "remaining_time": "15:15:57", "throughput": 331.64, "total_tokens": 32437344} {"current_steps": 25615, "total_steps": 40000, "loss": 0.0554, "lr": 0.08598390850759997, "epoch": 1.2515818532724208, "percentage": 64.04, "elapsed_time": "1 day, 3:10:11", "remaining_time": "15:15:29", "throughput": 331.7, "total_tokens": 32443584} {"current_steps": 25620, "total_steps": 40000, "loss": 0.0394, "lr": 0.08593064234175397, "epoch": 1.2518261549361152, "percentage": 64.05, "elapsed_time": "1 day, 3:10:14", "remaining_time": "15:15:01", "throughput": 331.75, "total_tokens": 32449600} {"current_steps": 25625, "total_steps": 40000, "loss": 0.0843, "lr": 0.08587738605620815, "epoch": 1.2520704565998093, "percentage": 64.06, "elapsed_time": "1 day, 3:10:17", "remaining_time": "15:14:33", "throughput": 331.8, "total_tokens": 32456288} {"current_steps": 25630, "total_steps": 40000, "loss": 0.0434, "lr": 0.08582413965917512, "epoch": 1.2523147582635037, "percentage": 64.08, "elapsed_time": "1 day, 3:10:20", "remaining_time": "15:14:05", "throughput": 331.86, "total_tokens": 32463008} {"current_steps": 25635, "total_steps": 40000, "loss": 0.0473, "lr": 0.08577090315886628, "epoch": 1.252559059927198, "percentage": 64.09, "elapsed_time": "1 day, 3:10:23", "remaining_time": "15:13:37", "throughput": 331.92, "total_tokens": 32469504} {"current_steps": 25640, "total_steps": 40000, "loss": 0.0484, "lr": 0.08571767656349136, "epoch": 1.2528033615908925, "percentage": 64.1, "elapsed_time": "1 day, 3:10:26", "remaining_time": "15:13:09", "throughput": 331.97, "total_tokens": 32475872} {"current_steps": 25645, "total_steps": 40000, "loss": 0.0587, "lr": 0.08566445988125847, "epoch": 1.2530476632545868, "percentage": 64.11, "elapsed_time": "1 day, 3:10:30", "remaining_time": "15:12:41", "throughput": 332.03, "total_tokens": 32482432} {"current_steps": 25650, "total_steps": 40000, "loss": 0.0481, "lr": 0.08561125312037436, "epoch": 1.2532919649182812, "percentage": 64.12, "elapsed_time": "1 day, 3:10:33", "remaining_time": "15:12:13", "throughput": 332.09, "total_tokens": 32488960} {"current_steps": 25655, "total_steps": 40000, "loss": 0.0764, "lr": 0.08555805628904424, "epoch": 1.2535362665819754, "percentage": 64.14, "elapsed_time": "1 day, 3:10:36", "remaining_time": "15:11:45", "throughput": 332.14, "total_tokens": 32495008} {"current_steps": 25660, "total_steps": 40000, "loss": 0.0638, "lr": 0.08550486939547161, "epoch": 1.2537805682456697, "percentage": 64.15, "elapsed_time": "1 day, 3:10:39", "remaining_time": "15:11:17", "throughput": 332.19, "total_tokens": 32501152} {"current_steps": 25665, "total_steps": 40000, "loss": 0.0606, "lr": 0.08545169244785869, "epoch": 1.2540248699093641, "percentage": 64.16, "elapsed_time": "1 day, 3:10:42", "remaining_time": "15:10:49", "throughput": 332.25, "total_tokens": 32507744} {"current_steps": 25670, "total_steps": 40000, "loss": 0.0722, "lr": 0.08539852545440589, "epoch": 1.2542691715730583, "percentage": 64.18, "elapsed_time": "1 day, 3:10:45", "remaining_time": "15:10:21", "throughput": 332.3, "total_tokens": 32514528} {"current_steps": 25675, "total_steps": 40000, "loss": 0.073, "lr": 0.08534536842331235, "epoch": 1.2545134732367527, "percentage": 64.19, "elapsed_time": "1 day, 3:10:48", "remaining_time": "15:09:53", "throughput": 332.36, "total_tokens": 32520704} {"current_steps": 25680, "total_steps": 40000, "loss": 0.0327, "lr": 0.08529222136277545, "epoch": 1.254757774900447, "percentage": 64.2, "elapsed_time": "1 day, 3:10:51", "remaining_time": "15:09:25", "throughput": 332.41, "total_tokens": 32527264} {"current_steps": 25685, "total_steps": 40000, "loss": 0.0619, "lr": 0.08523908428099125, "epoch": 1.2550020765641414, "percentage": 64.21, "elapsed_time": "1 day, 3:10:54", "remaining_time": "15:08:57", "throughput": 332.47, "total_tokens": 32533440} {"current_steps": 25690, "total_steps": 40000, "loss": 0.0394, "lr": 0.08518595718615402, "epoch": 1.2552463782278358, "percentage": 64.22, "elapsed_time": "1 day, 3:10:57", "remaining_time": "15:08:29", "throughput": 332.52, "total_tokens": 32540128} {"current_steps": 25695, "total_steps": 40000, "loss": 0.0591, "lr": 0.08513284008645675, "epoch": 1.2554906798915302, "percentage": 64.24, "elapsed_time": "1 day, 3:11:00", "remaining_time": "15:08:01", "throughput": 332.57, "total_tokens": 32545824} {"current_steps": 25700, "total_steps": 40000, "loss": 0.078, "lr": 0.08507973299009065, "epoch": 1.2557349815552243, "percentage": 64.25, "elapsed_time": "1 day, 3:11:03", "remaining_time": "15:07:33", "throughput": 332.62, "total_tokens": 32551936} {"current_steps": 25705, "total_steps": 40000, "loss": 0.0616, "lr": 0.08502663590524563, "epoch": 1.2559792832189187, "percentage": 64.26, "elapsed_time": "1 day, 3:11:07", "remaining_time": "15:07:05", "throughput": 332.68, "total_tokens": 32558752} {"current_steps": 25710, "total_steps": 40000, "loss": 0.051, "lr": 0.08497354884010981, "epoch": 1.256223584882613, "percentage": 64.28, "elapsed_time": "1 day, 3:11:10", "remaining_time": "15:06:37", "throughput": 332.74, "total_tokens": 32565312} {"current_steps": 25715, "total_steps": 40000, "loss": 0.0573, "lr": 0.0849204718028699, "epoch": 1.2564678865463073, "percentage": 64.29, "elapsed_time": "1 day, 3:11:13", "remaining_time": "15:06:09", "throughput": 332.8, "total_tokens": 32572160} {"current_steps": 25720, "total_steps": 40000, "loss": 0.0747, "lr": 0.08486740480171118, "epoch": 1.2567121882100016, "percentage": 64.3, "elapsed_time": "1 day, 3:11:16", "remaining_time": "15:05:42", "throughput": 332.85, "total_tokens": 32578336} {"current_steps": 25725, "total_steps": 40000, "loss": 0.0556, "lr": 0.08481434784481706, "epoch": 1.256956489873696, "percentage": 64.31, "elapsed_time": "1 day, 3:11:19", "remaining_time": "15:05:14", "throughput": 332.91, "total_tokens": 32584736} {"current_steps": 25730, "total_steps": 40000, "loss": 0.0529, "lr": 0.08476130094036968, "epoch": 1.2572007915373904, "percentage": 64.33, "elapsed_time": "1 day, 3:11:22", "remaining_time": "15:04:46", "throughput": 332.96, "total_tokens": 32590976} {"current_steps": 25735, "total_steps": 40000, "loss": 0.0401, "lr": 0.08470826409654961, "epoch": 1.2574450932010848, "percentage": 64.34, "elapsed_time": "1 day, 3:11:25", "remaining_time": "15:04:18", "throughput": 333.02, "total_tokens": 32597600} {"current_steps": 25740, "total_steps": 40000, "loss": 0.0533, "lr": 0.08465523732153564, "epoch": 1.2576893948647792, "percentage": 64.35, "elapsed_time": "1 day, 3:11:28", "remaining_time": "15:03:50", "throughput": 333.07, "total_tokens": 32603936} {"current_steps": 25745, "total_steps": 40000, "loss": 0.0801, "lr": 0.08460222062350532, "epoch": 1.2579336965284733, "percentage": 64.36, "elapsed_time": "1 day, 3:11:31", "remaining_time": "15:03:22", "throughput": 333.12, "total_tokens": 32610144} {"current_steps": 25750, "total_steps": 40000, "loss": 0.0436, "lr": 0.08454921401063442, "epoch": 1.2581779981921677, "percentage": 64.38, "elapsed_time": "1 day, 3:11:35", "remaining_time": "15:02:54", "throughput": 333.18, "total_tokens": 32616416} {"current_steps": 25755, "total_steps": 40000, "loss": 0.0619, "lr": 0.08449621749109716, "epoch": 1.258422299855862, "percentage": 64.39, "elapsed_time": "1 day, 3:11:38", "remaining_time": "15:02:27", "throughput": 333.23, "total_tokens": 32622816} {"current_steps": 25760, "total_steps": 40000, "loss": 0.063, "lr": 0.08444323107306641, "epoch": 1.2586666015195562, "percentage": 64.4, "elapsed_time": "1 day, 3:11:41", "remaining_time": "15:01:59", "throughput": 333.28, "total_tokens": 32628896} {"current_steps": 25765, "total_steps": 40000, "loss": 0.093, "lr": 0.0843902547647132, "epoch": 1.2589109031832506, "percentage": 64.41, "elapsed_time": "1 day, 3:11:44", "remaining_time": "15:01:31", "throughput": 333.34, "total_tokens": 32635104} {"current_steps": 25770, "total_steps": 40000, "loss": 0.061, "lr": 0.0843372885742072, "epoch": 1.259155204846945, "percentage": 64.42, "elapsed_time": "1 day, 3:11:47", "remaining_time": "15:01:03", "throughput": 333.39, "total_tokens": 32641376} {"current_steps": 25775, "total_steps": 40000, "loss": 0.0495, "lr": 0.08428433250971652, "epoch": 1.2593995065106394, "percentage": 64.44, "elapsed_time": "1 day, 3:11:50", "remaining_time": "15:00:35", "throughput": 333.44, "total_tokens": 32647648} {"current_steps": 25780, "total_steps": 40000, "loss": 0.0732, "lr": 0.08423138657940757, "epoch": 1.2596438081743337, "percentage": 64.45, "elapsed_time": "1 day, 3:11:53", "remaining_time": "15:00:08", "throughput": 333.5, "total_tokens": 32653632} {"current_steps": 25785, "total_steps": 40000, "loss": 0.0546, "lr": 0.08417845079144536, "epoch": 1.2598881098380281, "percentage": 64.46, "elapsed_time": "1 day, 3:11:56", "remaining_time": "14:59:40", "throughput": 333.54, "total_tokens": 32659456} {"current_steps": 25790, "total_steps": 40000, "loss": 0.0696, "lr": 0.08412552515399314, "epoch": 1.2601324115017223, "percentage": 64.48, "elapsed_time": "1 day, 3:11:59", "remaining_time": "14:59:12", "throughput": 333.6, "total_tokens": 32665440} {"current_steps": 25795, "total_steps": 40000, "loss": 0.0375, "lr": 0.08407260967521278, "epoch": 1.2603767131654167, "percentage": 64.49, "elapsed_time": "1 day, 3:12:02", "remaining_time": "14:58:44", "throughput": 333.65, "total_tokens": 32671872} {"current_steps": 25800, "total_steps": 40000, "loss": 0.062, "lr": 0.08401970436326454, "epoch": 1.260621014829111, "percentage": 64.5, "elapsed_time": "1 day, 3:12:05", "remaining_time": "14:58:16", "throughput": 333.7, "total_tokens": 32678176} {"current_steps": 25800, "total_steps": 40000, "eval_loss": 0.06488606333732605, "epoch": 1.260621014829111, "percentage": 64.5, "elapsed_time": "1 day, 3:22:45", "remaining_time": "15:04:09", "throughput": 331.54, "total_tokens": 32678176} {"current_steps": 25805, "total_steps": 40000, "loss": 0.0479, "lr": 0.08396680922630702, "epoch": 1.2608653164928052, "percentage": 64.51, "elapsed_time": "1 day, 3:22:49", "remaining_time": "15:03:41", "throughput": 331.59, "total_tokens": 32684192} {"current_steps": 25810, "total_steps": 40000, "loss": 0.0765, "lr": 0.08391392427249732, "epoch": 1.2611096181564996, "percentage": 64.53, "elapsed_time": "1 day, 3:22:52", "remaining_time": "15:03:13", "throughput": 331.64, "total_tokens": 32689984} {"current_steps": 25815, "total_steps": 40000, "loss": 0.0612, "lr": 0.08386104950999107, "epoch": 1.261353919820194, "percentage": 64.54, "elapsed_time": "1 day, 3:22:54", "remaining_time": "15:02:45", "throughput": 331.69, "total_tokens": 32695936} {"current_steps": 25820, "total_steps": 40000, "loss": 0.0543, "lr": 0.0838081849469421, "epoch": 1.2615982214838883, "percentage": 64.55, "elapsed_time": "1 day, 3:22:58", "remaining_time": "15:02:17", "throughput": 331.74, "total_tokens": 32702336} {"current_steps": 25825, "total_steps": 40000, "loss": 0.045, "lr": 0.08375533059150281, "epoch": 1.2618425231475827, "percentage": 64.56, "elapsed_time": "1 day, 3:23:01", "remaining_time": "15:01:49", "throughput": 331.79, "total_tokens": 32708480} {"current_steps": 25830, "total_steps": 40000, "loss": 0.0442, "lr": 0.08370248645182406, "epoch": 1.262086824811277, "percentage": 64.58, "elapsed_time": "1 day, 3:23:04", "remaining_time": "15:01:22", "throughput": 331.86, "total_tokens": 32715904} {"current_steps": 25835, "total_steps": 40000, "loss": 0.0419, "lr": 0.083649652536055, "epoch": 1.2623311264749713, "percentage": 64.59, "elapsed_time": "1 day, 3:23:07", "remaining_time": "15:00:54", "throughput": 331.91, "total_tokens": 32721920} {"current_steps": 25840, "total_steps": 40000, "loss": 0.0547, "lr": 0.08359682885234339, "epoch": 1.2625754281386656, "percentage": 64.6, "elapsed_time": "1 day, 3:23:10", "remaining_time": "15:00:26", "throughput": 331.97, "total_tokens": 32728640} {"current_steps": 25845, "total_steps": 40000, "loss": 0.0623, "lr": 0.08354401540883516, "epoch": 1.26281972980236, "percentage": 64.61, "elapsed_time": "1 day, 3:23:13", "remaining_time": "14:59:58", "throughput": 332.02, "total_tokens": 32735136} {"current_steps": 25850, "total_steps": 40000, "loss": 0.0348, "lr": 0.0834912122136749, "epoch": 1.2630640314660542, "percentage": 64.62, "elapsed_time": "1 day, 3:23:16", "remaining_time": "14:59:30", "throughput": 332.07, "total_tokens": 32741440} {"current_steps": 25855, "total_steps": 40000, "loss": 0.0759, "lr": 0.0834384192750056, "epoch": 1.2633083331297486, "percentage": 64.64, "elapsed_time": "1 day, 3:23:19", "remaining_time": "14:59:02", "throughput": 332.13, "total_tokens": 32747968} {"current_steps": 25860, "total_steps": 40000, "loss": 0.0762, "lr": 0.08338563660096844, "epoch": 1.263552634793443, "percentage": 64.65, "elapsed_time": "1 day, 3:23:23", "remaining_time": "14:58:35", "throughput": 332.18, "total_tokens": 32754240} {"current_steps": 25865, "total_steps": 40000, "loss": 0.0685, "lr": 0.08333286419970329, "epoch": 1.2637969364571373, "percentage": 64.66, "elapsed_time": "1 day, 3:23:26", "remaining_time": "14:58:07", "throughput": 332.24, "total_tokens": 32761152} {"current_steps": 25870, "total_steps": 40000, "loss": 0.0573, "lr": 0.08328010207934824, "epoch": 1.2640412381208317, "percentage": 64.68, "elapsed_time": "1 day, 3:23:29", "remaining_time": "14:57:39", "throughput": 332.29, "total_tokens": 32767040} {"current_steps": 25875, "total_steps": 40000, "loss": 0.0337, "lr": 0.08322735024803989, "epoch": 1.264285539784526, "percentage": 64.69, "elapsed_time": "1 day, 3:23:32", "remaining_time": "14:57:11", "throughput": 332.35, "total_tokens": 32773760} {"current_steps": 25880, "total_steps": 40000, "loss": 0.0365, "lr": 0.08317460871391331, "epoch": 1.2645298414482202, "percentage": 64.7, "elapsed_time": "1 day, 3:23:35", "remaining_time": "14:56:44", "throughput": 332.41, "total_tokens": 32780416} {"current_steps": 25885, "total_steps": 40000, "loss": 0.0564, "lr": 0.08312187748510179, "epoch": 1.2647741431119146, "percentage": 64.71, "elapsed_time": "1 day, 3:23:38", "remaining_time": "14:56:16", "throughput": 332.46, "total_tokens": 32786400} {"current_steps": 25890, "total_steps": 40000, "loss": 0.0779, "lr": 0.08306915656973726, "epoch": 1.265018444775609, "percentage": 64.72, "elapsed_time": "1 day, 3:23:41", "remaining_time": "14:55:48", "throughput": 332.51, "total_tokens": 32792704} {"current_steps": 25895, "total_steps": 40000, "loss": 0.0581, "lr": 0.08301644597594988, "epoch": 1.2652627464393031, "percentage": 64.74, "elapsed_time": "1 day, 3:23:44", "remaining_time": "14:55:20", "throughput": 332.56, "total_tokens": 32798912} {"current_steps": 25900, "total_steps": 40000, "loss": 0.0939, "lr": 0.08296374571186826, "epoch": 1.2655070481029975, "percentage": 64.75, "elapsed_time": "1 day, 3:23:47", "remaining_time": "14:54:53", "throughput": 332.61, "total_tokens": 32804768} {"current_steps": 25905, "total_steps": 40000, "loss": 0.076, "lr": 0.08291105578561955, "epoch": 1.265751349766692, "percentage": 64.76, "elapsed_time": "1 day, 3:23:50", "remaining_time": "14:54:25", "throughput": 332.67, "total_tokens": 32811200} {"current_steps": 25910, "total_steps": 40000, "loss": 0.0407, "lr": 0.08285837620532904, "epoch": 1.2659956514303863, "percentage": 64.78, "elapsed_time": "1 day, 3:23:53", "remaining_time": "14:53:57", "throughput": 332.72, "total_tokens": 32817088} {"current_steps": 25915, "total_steps": 40000, "loss": 0.0429, "lr": 0.0828057069791207, "epoch": 1.2662399530940807, "percentage": 64.79, "elapsed_time": "1 day, 3:23:56", "remaining_time": "14:53:29", "throughput": 332.77, "total_tokens": 32823552} {"current_steps": 25920, "total_steps": 40000, "loss": 0.0649, "lr": 0.0827530481151168, "epoch": 1.2664842547577748, "percentage": 64.8, "elapsed_time": "1 day, 3:24:00", "remaining_time": "14:53:02", "throughput": 332.83, "total_tokens": 32830464} {"current_steps": 25925, "total_steps": 40000, "loss": 0.0685, "lr": 0.08270039962143792, "epoch": 1.2667285564214692, "percentage": 64.81, "elapsed_time": "1 day, 3:24:03", "remaining_time": "14:52:34", "throughput": 332.89, "total_tokens": 32837184} {"current_steps": 25930, "total_steps": 40000, "loss": 0.0548, "lr": 0.08264776150620314, "epoch": 1.2669728580851636, "percentage": 64.83, "elapsed_time": "1 day, 3:24:06", "remaining_time": "14:52:07", "throughput": 332.94, "total_tokens": 32843808} {"current_steps": 25935, "total_steps": 40000, "loss": 0.076, "lr": 0.08259513377753, "epoch": 1.267217159748858, "percentage": 64.84, "elapsed_time": "1 day, 3:24:09", "remaining_time": "14:51:39", "throughput": 333.0, "total_tokens": 32850272} {"current_steps": 25940, "total_steps": 40000, "loss": 0.0494, "lr": 0.08254251644353423, "epoch": 1.2674614614125521, "percentage": 64.85, "elapsed_time": "1 day, 3:24:12", "remaining_time": "14:51:11", "throughput": 333.05, "total_tokens": 32856352} {"current_steps": 25945, "total_steps": 40000, "loss": 0.0533, "lr": 0.08248990951233022, "epoch": 1.2677057630762465, "percentage": 64.86, "elapsed_time": "1 day, 3:24:15", "remaining_time": "14:50:44", "throughput": 333.11, "total_tokens": 32863232} {"current_steps": 25950, "total_steps": 40000, "loss": 0.0801, "lr": 0.08243731299203048, "epoch": 1.2679500647399409, "percentage": 64.88, "elapsed_time": "1 day, 3:24:18", "remaining_time": "14:50:16", "throughput": 333.16, "total_tokens": 32869440} {"current_steps": 25955, "total_steps": 40000, "loss": 0.0726, "lr": 0.08238472689074612, "epoch": 1.2681943664036353, "percentage": 64.89, "elapsed_time": "1 day, 3:24:22", "remaining_time": "14:49:48", "throughput": 333.22, "total_tokens": 32875712} {"current_steps": 25960, "total_steps": 40000, "loss": 0.067, "lr": 0.08233215121658666, "epoch": 1.2684386680673296, "percentage": 64.9, "elapsed_time": "1 day, 3:24:25", "remaining_time": "14:49:21", "throughput": 333.27, "total_tokens": 32881728} {"current_steps": 25965, "total_steps": 40000, "loss": 0.063, "lr": 0.08227958597765982, "epoch": 1.2686829697310238, "percentage": 64.91, "elapsed_time": "1 day, 3:24:28", "remaining_time": "14:48:53", "throughput": 333.32, "total_tokens": 32887904} {"current_steps": 25970, "total_steps": 40000, "loss": 0.0554, "lr": 0.08222703118207181, "epoch": 1.2689272713947182, "percentage": 64.92, "elapsed_time": "1 day, 3:24:31", "remaining_time": "14:48:26", "throughput": 333.37, "total_tokens": 32894048} {"current_steps": 25975, "total_steps": 40000, "loss": 0.0737, "lr": 0.08217448683792734, "epoch": 1.2691715730584125, "percentage": 64.94, "elapsed_time": "1 day, 3:24:34", "remaining_time": "14:47:58", "throughput": 333.42, "total_tokens": 32900160} {"current_steps": 25980, "total_steps": 40000, "loss": 0.0558, "lr": 0.08212195295332926, "epoch": 1.269415874722107, "percentage": 64.95, "elapsed_time": "1 day, 3:24:37", "remaining_time": "14:47:30", "throughput": 333.48, "total_tokens": 32906496} {"current_steps": 25985, "total_steps": 40000, "loss": 0.0534, "lr": 0.08206942953637915, "epoch": 1.269660176385801, "percentage": 64.96, "elapsed_time": "1 day, 3:24:40", "remaining_time": "14:47:03", "throughput": 333.53, "total_tokens": 32912992} {"current_steps": 25990, "total_steps": 40000, "loss": 0.0561, "lr": 0.08201691659517658, "epoch": 1.2699044780494955, "percentage": 64.98, "elapsed_time": "1 day, 3:24:43", "remaining_time": "14:46:35", "throughput": 333.59, "total_tokens": 32919488} {"current_steps": 25995, "total_steps": 40000, "loss": 0.082, "lr": 0.08196441413781981, "epoch": 1.2701487797131898, "percentage": 64.99, "elapsed_time": "1 day, 3:24:46", "remaining_time": "14:46:08", "throughput": 333.64, "total_tokens": 32925536} {"current_steps": 26000, "total_steps": 40000, "loss": 0.0715, "lr": 0.08191192217240544, "epoch": 1.2703930813768842, "percentage": 65.0, "elapsed_time": "1 day, 3:24:49", "remaining_time": "14:45:40", "throughput": 333.69, "total_tokens": 32931456} {"current_steps": 26000, "total_steps": 40000, "eval_loss": 0.06263794749975204, "epoch": 1.2703930813768842, "percentage": 65.0, "elapsed_time": "1 day, 3:35:29", "remaining_time": "14:51:25", "throughput": 331.54, "total_tokens": 32931456} {"current_steps": 26005, "total_steps": 40000, "loss": 0.0691, "lr": 0.08185944070702823, "epoch": 1.2706373830405786, "percentage": 65.01, "elapsed_time": "1 day, 3:35:33", "remaining_time": "14:50:58", "throughput": 331.59, "total_tokens": 32937920} {"current_steps": 26010, "total_steps": 40000, "loss": 0.0567, "lr": 0.08180696974978159, "epoch": 1.2708816847042728, "percentage": 65.03, "elapsed_time": "1 day, 3:35:37", "remaining_time": "14:50:30", "throughput": 331.64, "total_tokens": 32944384} {"current_steps": 26015, "total_steps": 40000, "loss": 0.0619, "lr": 0.08175450930875724, "epoch": 1.2711259863679671, "percentage": 65.04, "elapsed_time": "1 day, 3:35:40", "remaining_time": "14:50:02", "throughput": 331.69, "total_tokens": 32950560} {"current_steps": 26020, "total_steps": 40000, "loss": 0.0442, "lr": 0.08170205939204513, "epoch": 1.2713702880316615, "percentage": 65.05, "elapsed_time": "1 day, 3:35:43", "remaining_time": "14:49:35", "throughput": 331.75, "total_tokens": 32956768} {"current_steps": 26025, "total_steps": 40000, "loss": 0.0455, "lr": 0.08164962000773379, "epoch": 1.271614589695356, "percentage": 65.06, "elapsed_time": "1 day, 3:35:46", "remaining_time": "14:49:07", "throughput": 331.8, "total_tokens": 32963200} {"current_steps": 26030, "total_steps": 40000, "loss": 0.0545, "lr": 0.08159719116390995, "epoch": 1.27185889135905, "percentage": 65.08, "elapsed_time": "1 day, 3:35:49", "remaining_time": "14:48:39", "throughput": 331.85, "total_tokens": 32969312} {"current_steps": 26035, "total_steps": 40000, "loss": 0.0391, "lr": 0.08154477286865887, "epoch": 1.2721031930227444, "percentage": 65.09, "elapsed_time": "1 day, 3:35:52", "remaining_time": "14:48:11", "throughput": 331.9, "total_tokens": 32975520} {"current_steps": 26040, "total_steps": 40000, "loss": 0.0636, "lr": 0.08149236513006404, "epoch": 1.2723474946864388, "percentage": 65.1, "elapsed_time": "1 day, 3:35:55", "remaining_time": "14:47:44", "throughput": 331.96, "total_tokens": 32981600} {"current_steps": 26045, "total_steps": 40000, "loss": 0.0396, "lr": 0.08143996795620746, "epoch": 1.2725917963501332, "percentage": 65.11, "elapsed_time": "1 day, 3:35:58", "remaining_time": "14:47:16", "throughput": 332.01, "total_tokens": 32987776} {"current_steps": 26050, "total_steps": 40000, "loss": 0.0537, "lr": 0.08138758135516938, "epoch": 1.2728360980138276, "percentage": 65.12, "elapsed_time": "1 day, 3:36:01", "remaining_time": "14:46:48", "throughput": 332.07, "total_tokens": 32994592} {"current_steps": 26055, "total_steps": 40000, "loss": 0.0589, "lr": 0.08133520533502851, "epoch": 1.2730803996775217, "percentage": 65.14, "elapsed_time": "1 day, 3:36:04", "remaining_time": "14:46:21", "throughput": 332.12, "total_tokens": 33000992} {"current_steps": 26060, "total_steps": 40000, "loss": 0.0489, "lr": 0.08128283990386184, "epoch": 1.2733247013412161, "percentage": 65.15, "elapsed_time": "1 day, 3:36:07", "remaining_time": "14:45:53", "throughput": 332.17, "total_tokens": 33007168} {"current_steps": 26065, "total_steps": 40000, "loss": 0.0545, "lr": 0.08123048506974488, "epoch": 1.2735690030049105, "percentage": 65.16, "elapsed_time": "1 day, 3:36:10", "remaining_time": "14:45:26", "throughput": 332.23, "total_tokens": 33013536} {"current_steps": 26070, "total_steps": 40000, "loss": 0.0648, "lr": 0.08117814084075124, "epoch": 1.2738133046686049, "percentage": 65.18, "elapsed_time": "1 day, 3:36:13", "remaining_time": "14:44:58", "throughput": 332.28, "total_tokens": 33019872} {"current_steps": 26075, "total_steps": 40000, "loss": 0.0501, "lr": 0.08112580722495318, "epoch": 1.274057606332299, "percentage": 65.19, "elapsed_time": "1 day, 3:36:17", "remaining_time": "14:44:30", "throughput": 332.33, "total_tokens": 33026272} {"current_steps": 26080, "total_steps": 40000, "loss": 0.024, "lr": 0.08107348423042122, "epoch": 1.2743019079959934, "percentage": 65.2, "elapsed_time": "1 day, 3:36:20", "remaining_time": "14:44:03", "throughput": 332.38, "total_tokens": 33032256} {"current_steps": 26085, "total_steps": 40000, "loss": 0.0401, "lr": 0.08102117186522413, "epoch": 1.2745462096596878, "percentage": 65.21, "elapsed_time": "1 day, 3:36:23", "remaining_time": "14:43:35", "throughput": 332.44, "total_tokens": 33038464} {"current_steps": 26090, "total_steps": 40000, "loss": 0.0301, "lr": 0.08096887013742916, "epoch": 1.2747905113233822, "percentage": 65.22, "elapsed_time": "1 day, 3:36:26", "remaining_time": "14:43:08", "throughput": 332.49, "total_tokens": 33045088} {"current_steps": 26095, "total_steps": 40000, "loss": 0.0644, "lr": 0.08091657905510198, "epoch": 1.2750348129870765, "percentage": 65.24, "elapsed_time": "1 day, 3:36:29", "remaining_time": "14:42:40", "throughput": 332.55, "total_tokens": 33051424} {"current_steps": 26100, "total_steps": 40000, "loss": 0.0474, "lr": 0.08086429862630642, "epoch": 1.2752791146507707, "percentage": 65.25, "elapsed_time": "1 day, 3:36:32", "remaining_time": "14:42:13", "throughput": 332.6, "total_tokens": 33057888} {"current_steps": 26105, "total_steps": 40000, "loss": 0.0365, "lr": 0.08081202885910488, "epoch": 1.275523416314465, "percentage": 65.26, "elapsed_time": "1 day, 3:36:35", "remaining_time": "14:41:45", "throughput": 332.66, "total_tokens": 33064768} {"current_steps": 26110, "total_steps": 40000, "loss": 0.0604, "lr": 0.08075976976155795, "epoch": 1.2757677179781595, "percentage": 65.28, "elapsed_time": "1 day, 3:36:38", "remaining_time": "14:41:18", "throughput": 332.71, "total_tokens": 33070720} {"current_steps": 26115, "total_steps": 40000, "loss": 0.0345, "lr": 0.08070752134172461, "epoch": 1.2760120196418536, "percentage": 65.29, "elapsed_time": "1 day, 3:36:41", "remaining_time": "14:40:50", "throughput": 332.76, "total_tokens": 33076896} {"current_steps": 26120, "total_steps": 40000, "loss": 0.0507, "lr": 0.08065528360766229, "epoch": 1.276256321305548, "percentage": 65.3, "elapsed_time": "1 day, 3:36:44", "remaining_time": "14:40:23", "throughput": 332.81, "total_tokens": 33083072} {"current_steps": 26125, "total_steps": 40000, "loss": 0.059, "lr": 0.08060305656742664, "epoch": 1.2765006229692424, "percentage": 65.31, "elapsed_time": "1 day, 3:36:47", "remaining_time": "14:39:55", "throughput": 332.87, "total_tokens": 33089536} {"current_steps": 26130, "total_steps": 40000, "loss": 0.0617, "lr": 0.08055084022907182, "epoch": 1.2767449246329368, "percentage": 65.33, "elapsed_time": "1 day, 3:36:51", "remaining_time": "14:39:28", "throughput": 332.92, "total_tokens": 33095872} {"current_steps": 26135, "total_steps": 40000, "loss": 0.0429, "lr": 0.08049863460065014, "epoch": 1.2769892262966311, "percentage": 65.34, "elapsed_time": "1 day, 3:36:54", "remaining_time": "14:39:00", "throughput": 332.98, "total_tokens": 33102464} {"current_steps": 26140, "total_steps": 40000, "loss": 0.0456, "lr": 0.0804464396902124, "epoch": 1.2772335279603255, "percentage": 65.35, "elapsed_time": "1 day, 3:36:57", "remaining_time": "14:38:33", "throughput": 333.03, "total_tokens": 33108800} {"current_steps": 26145, "total_steps": 40000, "loss": 0.0564, "lr": 0.08039425550580777, "epoch": 1.2774778296240197, "percentage": 65.36, "elapsed_time": "1 day, 3:37:00", "remaining_time": "14:38:05", "throughput": 333.08, "total_tokens": 33115392} {"current_steps": 26150, "total_steps": 40000, "loss": 0.0505, "lr": 0.08034208205548363, "epoch": 1.277722131287714, "percentage": 65.38, "elapsed_time": "1 day, 3:37:03", "remaining_time": "14:37:38", "throughput": 333.14, "total_tokens": 33121888} {"current_steps": 26155, "total_steps": 40000, "loss": 0.0981, "lr": 0.08028991934728581, "epoch": 1.2779664329514084, "percentage": 65.39, "elapsed_time": "1 day, 3:37:06", "remaining_time": "14:37:10", "throughput": 333.19, "total_tokens": 33128192} {"current_steps": 26160, "total_steps": 40000, "loss": 0.0695, "lr": 0.0802377673892585, "epoch": 1.2782107346151026, "percentage": 65.4, "elapsed_time": "1 day, 3:37:09", "remaining_time": "14:36:43", "throughput": 333.25, "total_tokens": 33134432} {"current_steps": 26165, "total_steps": 40000, "loss": 0.069, "lr": 0.0801856261894441, "epoch": 1.278455036278797, "percentage": 65.41, "elapsed_time": "1 day, 3:37:12", "remaining_time": "14:36:15", "throughput": 333.3, "total_tokens": 33140480} {"current_steps": 26170, "total_steps": 40000, "loss": 0.0496, "lr": 0.08013349575588354, "epoch": 1.2786993379424914, "percentage": 65.42, "elapsed_time": "1 day, 3:37:15", "remaining_time": "14:35:48", "throughput": 333.35, "total_tokens": 33146432} {"current_steps": 26175, "total_steps": 40000, "loss": 0.0506, "lr": 0.08008137609661586, "epoch": 1.2789436396061857, "percentage": 65.44, "elapsed_time": "1 day, 3:37:18", "remaining_time": "14:35:21", "throughput": 333.4, "total_tokens": 33152576} {"current_steps": 26180, "total_steps": 40000, "loss": 0.0668, "lr": 0.08002926721967872, "epoch": 1.2791879412698801, "percentage": 65.45, "elapsed_time": "1 day, 3:37:21", "remaining_time": "14:34:53", "throughput": 333.45, "total_tokens": 33158816} {"current_steps": 26185, "total_steps": 40000, "loss": 0.0566, "lr": 0.07997716913310782, "epoch": 1.2794322429335745, "percentage": 65.46, "elapsed_time": "1 day, 3:37:24", "remaining_time": "14:34:26", "throughput": 333.5, "total_tokens": 33164800} {"current_steps": 26190, "total_steps": 40000, "loss": 0.0673, "lr": 0.07992508184493745, "epoch": 1.2796765445972687, "percentage": 65.48, "elapsed_time": "1 day, 3:37:27", "remaining_time": "14:33:58", "throughput": 333.55, "total_tokens": 33170976} {"current_steps": 26195, "total_steps": 40000, "loss": 0.0554, "lr": 0.07987300536320001, "epoch": 1.279920846260963, "percentage": 65.49, "elapsed_time": "1 day, 3:37:30", "remaining_time": "14:33:31", "throughput": 333.61, "total_tokens": 33177536} {"current_steps": 26200, "total_steps": 40000, "loss": 0.056, "lr": 0.07982093969592649, "epoch": 1.2801651479246574, "percentage": 65.5, "elapsed_time": "1 day, 3:37:33", "remaining_time": "14:33:04", "throughput": 333.66, "total_tokens": 33184096} {"current_steps": 26200, "total_steps": 40000, "eval_loss": 0.06283564120531082, "epoch": 1.2801651479246574, "percentage": 65.5, "elapsed_time": "1 day, 3:48:13", "remaining_time": "14:38:40", "throughput": 331.53, "total_tokens": 33184096} {"current_steps": 26205, "total_steps": 40000, "loss": 0.0359, "lr": 0.07976888485114592, "epoch": 1.2804094495883516, "percentage": 65.51, "elapsed_time": "1 day, 3:48:17", "remaining_time": "14:38:13", "throughput": 331.58, "total_tokens": 33190240} {"current_steps": 26210, "total_steps": 40000, "loss": 0.0501, "lr": 0.07971684083688595, "epoch": 1.280653751252046, "percentage": 65.53, "elapsed_time": "1 day, 3:48:20", "remaining_time": "14:37:46", "throughput": 331.63, "total_tokens": 33196288} {"current_steps": 26215, "total_steps": 40000, "loss": 0.0431, "lr": 0.0796648076611723, "epoch": 1.2808980529157403, "percentage": 65.54, "elapsed_time": "1 day, 3:48:23", "remaining_time": "14:37:18", "throughput": 331.68, "total_tokens": 33202080} {"current_steps": 26220, "total_steps": 40000, "loss": 0.0529, "lr": 0.07961278533202922, "epoch": 1.2811423545794347, "percentage": 65.55, "elapsed_time": "1 day, 3:48:26", "remaining_time": "14:36:51", "throughput": 331.73, "total_tokens": 33208416} {"current_steps": 26225, "total_steps": 40000, "loss": 0.0326, "lr": 0.07956077385747919, "epoch": 1.281386656243129, "percentage": 65.56, "elapsed_time": "1 day, 3:48:29", "remaining_time": "14:36:23", "throughput": 331.79, "total_tokens": 33215072} {"current_steps": 26230, "total_steps": 40000, "loss": 0.0462, "lr": 0.079508773245543, "epoch": 1.2816309579068235, "percentage": 65.58, "elapsed_time": "1 day, 3:48:32", "remaining_time": "14:35:56", "throughput": 331.84, "total_tokens": 33221696} {"current_steps": 26235, "total_steps": 40000, "loss": 0.0635, "lr": 0.07945678350423982, "epoch": 1.2818752595705176, "percentage": 65.59, "elapsed_time": "1 day, 3:48:35", "remaining_time": "14:35:28", "throughput": 331.9, "total_tokens": 33228192} {"current_steps": 26240, "total_steps": 40000, "loss": 0.0383, "lr": 0.07940480464158717, "epoch": 1.282119561234212, "percentage": 65.6, "elapsed_time": "1 day, 3:48:38", "remaining_time": "14:35:01", "throughput": 331.95, "total_tokens": 33234240} {"current_steps": 26245, "total_steps": 40000, "loss": 0.0571, "lr": 0.07935283666560076, "epoch": 1.2823638628979064, "percentage": 65.61, "elapsed_time": "1 day, 3:48:41", "remaining_time": "14:34:33", "throughput": 332.0, "total_tokens": 33240512} {"current_steps": 26250, "total_steps": 40000, "loss": 0.0571, "lr": 0.07930087958429478, "epoch": 1.2826081645616005, "percentage": 65.62, "elapsed_time": "1 day, 3:48:45", "remaining_time": "14:34:06", "throughput": 332.06, "total_tokens": 33247648} {"current_steps": 26255, "total_steps": 40000, "loss": 0.0537, "lr": 0.07924893340568159, "epoch": 1.282852466225295, "percentage": 65.64, "elapsed_time": "1 day, 3:48:48", "remaining_time": "14:33:39", "throughput": 332.11, "total_tokens": 33254016} {"current_steps": 26260, "total_steps": 40000, "loss": 0.0696, "lr": 0.07919699813777205, "epoch": 1.2830967678889893, "percentage": 65.65, "elapsed_time": "1 day, 3:48:51", "remaining_time": "14:33:11", "throughput": 332.17, "total_tokens": 33260352} {"current_steps": 26265, "total_steps": 40000, "loss": 0.0409, "lr": 0.07914507378857515, "epoch": 1.2833410695526837, "percentage": 65.66, "elapsed_time": "1 day, 3:48:54", "remaining_time": "14:32:44", "throughput": 332.22, "total_tokens": 33266976} {"current_steps": 26270, "total_steps": 40000, "loss": 0.0733, "lr": 0.07909316036609822, "epoch": 1.283585371216378, "percentage": 65.67, "elapsed_time": "1 day, 3:48:57", "remaining_time": "14:32:16", "throughput": 332.27, "total_tokens": 33273056} {"current_steps": 26275, "total_steps": 40000, "loss": 0.0424, "lr": 0.07904125787834704, "epoch": 1.2838296728800724, "percentage": 65.69, "elapsed_time": "1 day, 3:49:00", "remaining_time": "14:31:49", "throughput": 332.32, "total_tokens": 33278976} {"current_steps": 26280, "total_steps": 40000, "loss": 0.0437, "lr": 0.07898936633332569, "epoch": 1.2840739745437666, "percentage": 65.7, "elapsed_time": "1 day, 3:49:03", "remaining_time": "14:31:21", "throughput": 332.37, "total_tokens": 33285056} {"current_steps": 26285, "total_steps": 40000, "loss": 0.0322, "lr": 0.07893748573903635, "epoch": 1.284318276207461, "percentage": 65.71, "elapsed_time": "1 day, 3:49:06", "remaining_time": "14:30:54", "throughput": 332.43, "total_tokens": 33291232} {"current_steps": 26290, "total_steps": 40000, "loss": 0.0579, "lr": 0.0788856161034798, "epoch": 1.2845625778711554, "percentage": 65.72, "elapsed_time": "1 day, 3:49:09", "remaining_time": "14:30:27", "throughput": 332.48, "total_tokens": 33297472} {"current_steps": 26295, "total_steps": 40000, "loss": 0.0338, "lr": 0.07883375743465487, "epoch": 1.2848068795348495, "percentage": 65.74, "elapsed_time": "1 day, 3:49:12", "remaining_time": "14:29:59", "throughput": 332.53, "total_tokens": 33303552} {"current_steps": 26300, "total_steps": 40000, "loss": 0.0627, "lr": 0.07878190974055888, "epoch": 1.285051181198544, "percentage": 65.75, "elapsed_time": "1 day, 3:49:15", "remaining_time": "14:29:32", "throughput": 332.58, "total_tokens": 33309760} {"current_steps": 26305, "total_steps": 40000, "loss": 0.0825, "lr": 0.07873007302918746, "epoch": 1.2852954828622383, "percentage": 65.76, "elapsed_time": "1 day, 3:49:18", "remaining_time": "14:29:04", "throughput": 332.64, "total_tokens": 33316320} {"current_steps": 26310, "total_steps": 40000, "loss": 0.0354, "lr": 0.07867824730853433, "epoch": 1.2855397845259326, "percentage": 65.77, "elapsed_time": "1 day, 3:49:21", "remaining_time": "14:28:37", "throughput": 332.69, "total_tokens": 33322560} {"current_steps": 26315, "total_steps": 40000, "loss": 0.0573, "lr": 0.07862643258659176, "epoch": 1.285784086189627, "percentage": 65.79, "elapsed_time": "1 day, 3:49:24", "remaining_time": "14:28:10", "throughput": 332.74, "total_tokens": 33328992} {"current_steps": 26320, "total_steps": 40000, "loss": 0.0359, "lr": 0.07857462887135026, "epoch": 1.2860283878533214, "percentage": 65.8, "elapsed_time": "1 day, 3:49:28", "remaining_time": "14:27:43", "throughput": 332.79, "total_tokens": 33335328} {"current_steps": 26325, "total_steps": 40000, "loss": 0.0373, "lr": 0.0785228361707986, "epoch": 1.2862726895170156, "percentage": 65.81, "elapsed_time": "1 day, 3:49:31", "remaining_time": "14:27:15", "throughput": 332.85, "total_tokens": 33341856} {"current_steps": 26330, "total_steps": 40000, "loss": 0.0432, "lr": 0.07847105449292378, "epoch": 1.28651699118071, "percentage": 65.83, "elapsed_time": "1 day, 3:49:34", "remaining_time": "14:26:48", "throughput": 332.9, "total_tokens": 33348064} {"current_steps": 26335, "total_steps": 40000, "loss": 0.0545, "lr": 0.0784192838457113, "epoch": 1.2867612928444043, "percentage": 65.84, "elapsed_time": "1 day, 3:49:37", "remaining_time": "14:26:21", "throughput": 332.95, "total_tokens": 33354336} {"current_steps": 26340, "total_steps": 40000, "loss": 0.0417, "lr": 0.07836752423714473, "epoch": 1.2870055945080985, "percentage": 65.85, "elapsed_time": "1 day, 3:49:40", "remaining_time": "14:25:53", "throughput": 333.01, "total_tokens": 33360704} {"current_steps": 26345, "total_steps": 40000, "loss": 0.045, "lr": 0.07831577567520616, "epoch": 1.2872498961717929, "percentage": 65.86, "elapsed_time": "1 day, 3:49:43", "remaining_time": "14:25:26", "throughput": 333.06, "total_tokens": 33366752} {"current_steps": 26350, "total_steps": 40000, "loss": 0.0656, "lr": 0.07826403816787579, "epoch": 1.2874941978354872, "percentage": 65.88, "elapsed_time": "1 day, 3:49:46", "remaining_time": "14:24:59", "throughput": 333.11, "total_tokens": 33373024} {"current_steps": 26355, "total_steps": 40000, "loss": 0.0373, "lr": 0.0782123117231322, "epoch": 1.2877384994991816, "percentage": 65.89, "elapsed_time": "1 day, 3:49:49", "remaining_time": "14:24:32", "throughput": 333.16, "total_tokens": 33379584} {"current_steps": 26360, "total_steps": 40000, "loss": 0.0295, "lr": 0.07816059634895237, "epoch": 1.287982801162876, "percentage": 65.9, "elapsed_time": "1 day, 3:49:52", "remaining_time": "14:24:04", "throughput": 333.22, "total_tokens": 33386048} {"current_steps": 26365, "total_steps": 40000, "loss": 0.0884, "lr": 0.0781088920533113, "epoch": 1.2882271028265704, "percentage": 65.91, "elapsed_time": "1 day, 3:49:55", "remaining_time": "14:23:37", "throughput": 333.27, "total_tokens": 33391936} {"current_steps": 26370, "total_steps": 40000, "loss": 0.0552, "lr": 0.07805719884418257, "epoch": 1.2884714044902645, "percentage": 65.92, "elapsed_time": "1 day, 3:49:58", "remaining_time": "14:23:10", "throughput": 333.32, "total_tokens": 33398784} {"current_steps": 26375, "total_steps": 40000, "loss": 0.0548, "lr": 0.07800551672953779, "epoch": 1.288715706153959, "percentage": 65.94, "elapsed_time": "1 day, 3:50:01", "remaining_time": "14:22:43", "throughput": 333.37, "total_tokens": 33404704} {"current_steps": 26380, "total_steps": 40000, "loss": 0.0767, "lr": 0.07795384571734709, "epoch": 1.2889600078176533, "percentage": 65.95, "elapsed_time": "1 day, 3:50:05", "remaining_time": "14:22:15", "throughput": 333.43, "total_tokens": 33411680} {"current_steps": 26385, "total_steps": 40000, "loss": 0.1135, "lr": 0.07790218581557883, "epoch": 1.2892043094813475, "percentage": 65.96, "elapsed_time": "1 day, 3:50:08", "remaining_time": "14:21:48", "throughput": 333.48, "total_tokens": 33417664} {"current_steps": 26390, "total_steps": 40000, "loss": 0.0902, "lr": 0.07785053703219949, "epoch": 1.2894486111450418, "percentage": 65.97, "elapsed_time": "1 day, 3:50:11", "remaining_time": "14:21:21", "throughput": 333.54, "total_tokens": 33424000} {"current_steps": 26395, "total_steps": 40000, "loss": 0.0536, "lr": 0.07779889937517409, "epoch": 1.2896929128087362, "percentage": 65.99, "elapsed_time": "1 day, 3:50:14", "remaining_time": "14:20:54", "throughput": 333.59, "total_tokens": 33430144} {"current_steps": 26400, "total_steps": 40000, "loss": 0.0696, "lr": 0.0777472728524657, "epoch": 1.2899372144724306, "percentage": 66.0, "elapsed_time": "1 day, 3:50:17", "remaining_time": "14:20:27", "throughput": 333.64, "total_tokens": 33436864} {"current_steps": 26400, "total_steps": 40000, "eval_loss": 0.06357955187559128, "epoch": 1.2899372144724306, "percentage": 66.0, "elapsed_time": "1 day, 4:00:57", "remaining_time": "14:25:56", "throughput": 331.53, "total_tokens": 33436864} {"current_steps": 26405, "total_steps": 40000, "loss": 0.0466, "lr": 0.07769565747203584, "epoch": 1.290181516136125, "percentage": 66.01, "elapsed_time": "1 day, 4:01:02", "remaining_time": "14:25:30", "throughput": 331.57, "total_tokens": 33443264} {"current_steps": 26410, "total_steps": 40000, "loss": 0.0717, "lr": 0.07764405324184427, "epoch": 1.2904258177998194, "percentage": 66.03, "elapsed_time": "1 day, 4:01:05", "remaining_time": "14:25:03", "throughput": 331.63, "total_tokens": 33449536} {"current_steps": 26415, "total_steps": 40000, "loss": 0.0498, "lr": 0.07759246016984889, "epoch": 1.2906701194635135, "percentage": 66.04, "elapsed_time": "1 day, 4:01:08", "remaining_time": "14:24:35", "throughput": 331.68, "total_tokens": 33455616} {"current_steps": 26420, "total_steps": 40000, "loss": 0.0551, "lr": 0.07754087826400609, "epoch": 1.290914421127208, "percentage": 66.05, "elapsed_time": "1 day, 4:01:11", "remaining_time": "14:24:08", "throughput": 331.73, "total_tokens": 33462464} {"current_steps": 26425, "total_steps": 40000, "loss": 0.0743, "lr": 0.0774893075322705, "epoch": 1.2911587227909023, "percentage": 66.06, "elapsed_time": "1 day, 4:01:14", "remaining_time": "14:23:41", "throughput": 331.78, "total_tokens": 33468640} {"current_steps": 26430, "total_steps": 40000, "loss": 0.0366, "lr": 0.07743774798259484, "epoch": 1.2914030244545964, "percentage": 66.07, "elapsed_time": "1 day, 4:01:17", "remaining_time": "14:23:13", "throughput": 331.83, "total_tokens": 33474592} {"current_steps": 26435, "total_steps": 40000, "loss": 0.048, "lr": 0.07738619962293032, "epoch": 1.2916473261182908, "percentage": 66.09, "elapsed_time": "1 day, 4:01:20", "remaining_time": "14:22:46", "throughput": 331.88, "total_tokens": 33480736} {"current_steps": 26440, "total_steps": 40000, "loss": 0.0664, "lr": 0.0773346624612264, "epoch": 1.2918916277819852, "percentage": 66.1, "elapsed_time": "1 day, 4:01:23", "remaining_time": "14:22:19", "throughput": 331.93, "total_tokens": 33486784} {"current_steps": 26445, "total_steps": 40000, "loss": 0.0634, "lr": 0.07728313650543066, "epoch": 1.2921359294456796, "percentage": 66.11, "elapsed_time": "1 day, 4:01:26", "remaining_time": "14:21:51", "throughput": 331.98, "total_tokens": 33492608} {"current_steps": 26450, "total_steps": 40000, "loss": 0.0698, "lr": 0.07723162176348913, "epoch": 1.292380231109374, "percentage": 66.12, "elapsed_time": "1 day, 4:01:29", "remaining_time": "14:21:24", "throughput": 332.03, "total_tokens": 33498240} {"current_steps": 26455, "total_steps": 40000, "loss": 0.0712, "lr": 0.07718011824334593, "epoch": 1.292624532773068, "percentage": 66.14, "elapsed_time": "1 day, 4:01:32", "remaining_time": "14:20:57", "throughput": 332.08, "total_tokens": 33504672} {"current_steps": 26460, "total_steps": 40000, "loss": 0.0632, "lr": 0.07712862595294363, "epoch": 1.2928688344367625, "percentage": 66.15, "elapsed_time": "1 day, 4:01:35", "remaining_time": "14:20:30", "throughput": 332.13, "total_tokens": 33511040} {"current_steps": 26465, "total_steps": 40000, "loss": 0.0715, "lr": 0.07707714490022301, "epoch": 1.2931131361004569, "percentage": 66.16, "elapsed_time": "1 day, 4:01:38", "remaining_time": "14:20:02", "throughput": 332.19, "total_tokens": 33517152} {"current_steps": 26470, "total_steps": 40000, "loss": 0.055, "lr": 0.07702567509312298, "epoch": 1.2933574377641512, "percentage": 66.17, "elapsed_time": "1 day, 4:01:42", "remaining_time": "14:19:35", "throughput": 332.25, "total_tokens": 33524800} {"current_steps": 26475, "total_steps": 40000, "loss": 0.0581, "lr": 0.07697421653958098, "epoch": 1.2936017394278454, "percentage": 66.19, "elapsed_time": "1 day, 4:01:45", "remaining_time": "14:19:08", "throughput": 332.31, "total_tokens": 33531744} {"current_steps": 26480, "total_steps": 40000, "loss": 0.0858, "lr": 0.07692276924753247, "epoch": 1.2938460410915398, "percentage": 66.2, "elapsed_time": "1 day, 4:01:48", "remaining_time": "14:18:41", "throughput": 332.36, "total_tokens": 33538112} {"current_steps": 26485, "total_steps": 40000, "loss": 0.1084, "lr": 0.07687133322491124, "epoch": 1.2940903427552342, "percentage": 66.21, "elapsed_time": "1 day, 4:01:51", "remaining_time": "14:18:14", "throughput": 332.42, "total_tokens": 33545024} {"current_steps": 26490, "total_steps": 40000, "loss": 0.0424, "lr": 0.07681990847964948, "epoch": 1.2943346444189285, "percentage": 66.22, "elapsed_time": "1 day, 4:01:54", "remaining_time": "14:17:46", "throughput": 332.47, "total_tokens": 33551264} {"current_steps": 26495, "total_steps": 40000, "loss": 0.0622, "lr": 0.0767684950196774, "epoch": 1.294578946082623, "percentage": 66.24, "elapsed_time": "1 day, 4:01:57", "remaining_time": "14:17:19", "throughput": 332.52, "total_tokens": 33557440} {"current_steps": 26500, "total_steps": 40000, "loss": 0.0515, "lr": 0.0767170928529237, "epoch": 1.294823247746317, "percentage": 66.25, "elapsed_time": "1 day, 4:02:00", "remaining_time": "14:16:52", "throughput": 332.57, "total_tokens": 33563744} {"current_steps": 26505, "total_steps": 40000, "loss": 0.0586, "lr": 0.07666570198731526, "epoch": 1.2950675494100115, "percentage": 66.26, "elapsed_time": "1 day, 4:02:04", "remaining_time": "14:16:25", "throughput": 332.63, "total_tokens": 33569984} {"current_steps": 26510, "total_steps": 40000, "loss": 0.0537, "lr": 0.07661432243077708, "epoch": 1.2953118510737058, "percentage": 66.27, "elapsed_time": "1 day, 4:02:07", "remaining_time": "14:15:58", "throughput": 332.69, "total_tokens": 33577280} {"current_steps": 26515, "total_steps": 40000, "loss": 0.0378, "lr": 0.0765629541912326, "epoch": 1.2955561527374002, "percentage": 66.29, "elapsed_time": "1 day, 4:02:10", "remaining_time": "14:15:31", "throughput": 332.74, "total_tokens": 33583392} {"current_steps": 26520, "total_steps": 40000, "loss": 0.067, "lr": 0.07651159727660352, "epoch": 1.2958004544010944, "percentage": 66.3, "elapsed_time": "1 day, 4:02:13", "remaining_time": "14:15:04", "throughput": 332.79, "total_tokens": 33589536} {"current_steps": 26525, "total_steps": 40000, "loss": 0.0459, "lr": 0.07646025169480959, "epoch": 1.2960447560647887, "percentage": 66.31, "elapsed_time": "1 day, 4:02:16", "remaining_time": "14:14:36", "throughput": 332.84, "total_tokens": 33595808} {"current_steps": 26530, "total_steps": 40000, "loss": 0.0802, "lr": 0.07640891745376908, "epoch": 1.2962890577284831, "percentage": 66.33, "elapsed_time": "1 day, 4:02:19", "remaining_time": "14:14:09", "throughput": 332.89, "total_tokens": 33601792} {"current_steps": 26535, "total_steps": 40000, "loss": 0.0851, "lr": 0.07635759456139822, "epoch": 1.2965333593921775, "percentage": 66.34, "elapsed_time": "1 day, 4:02:22", "remaining_time": "14:13:42", "throughput": 332.94, "total_tokens": 33607776} {"current_steps": 26540, "total_steps": 40000, "loss": 0.0551, "lr": 0.0763062830256118, "epoch": 1.2967776610558719, "percentage": 66.35, "elapsed_time": "1 day, 4:02:25", "remaining_time": "14:13:15", "throughput": 333.0, "total_tokens": 33614496} {"current_steps": 26545, "total_steps": 40000, "loss": 0.0477, "lr": 0.07625498285432258, "epoch": 1.297021962719566, "percentage": 66.36, "elapsed_time": "1 day, 4:02:28", "remaining_time": "14:12:48", "throughput": 333.05, "total_tokens": 33621184} {"current_steps": 26550, "total_steps": 40000, "loss": 0.0731, "lr": 0.07620369405544176, "epoch": 1.2972662643832604, "percentage": 66.38, "elapsed_time": "1 day, 4:02:32", "remaining_time": "14:12:21", "throughput": 333.11, "total_tokens": 33627808} {"current_steps": 26555, "total_steps": 40000, "loss": 0.0692, "lr": 0.07615241663687868, "epoch": 1.2975105660469548, "percentage": 66.39, "elapsed_time": "1 day, 4:02:35", "remaining_time": "14:11:54", "throughput": 333.16, "total_tokens": 33634304} {"current_steps": 26560, "total_steps": 40000, "loss": 0.0458, "lr": 0.07610115060654106, "epoch": 1.2977548677106492, "percentage": 66.4, "elapsed_time": "1 day, 4:02:38", "remaining_time": "14:11:27", "throughput": 333.22, "total_tokens": 33640896} {"current_steps": 26565, "total_steps": 40000, "loss": 0.0438, "lr": 0.07604989597233458, "epoch": 1.2979991693743433, "percentage": 66.41, "elapsed_time": "1 day, 4:02:41", "remaining_time": "14:11:00", "throughput": 333.28, "total_tokens": 33647968} {"current_steps": 26570, "total_steps": 40000, "loss": 0.0596, "lr": 0.07599865274216352, "epoch": 1.2982434710380377, "percentage": 66.42, "elapsed_time": "1 day, 4:02:44", "remaining_time": "14:10:33", "throughput": 333.33, "total_tokens": 33654816} {"current_steps": 26575, "total_steps": 40000, "loss": 0.0551, "lr": 0.07594742092393013, "epoch": 1.298487772701732, "percentage": 66.44, "elapsed_time": "1 day, 4:02:47", "remaining_time": "14:10:06", "throughput": 333.39, "total_tokens": 33661472} {"current_steps": 26580, "total_steps": 40000, "loss": 0.0724, "lr": 0.07589620052553503, "epoch": 1.2987320743654265, "percentage": 66.45, "elapsed_time": "1 day, 4:02:50", "remaining_time": "14:09:39", "throughput": 333.44, "total_tokens": 33667520} {"current_steps": 26585, "total_steps": 40000, "loss": 0.0573, "lr": 0.0758449915548771, "epoch": 1.2989763760291209, "percentage": 66.46, "elapsed_time": "1 day, 4:02:53", "remaining_time": "14:09:12", "throughput": 333.49, "total_tokens": 33673440} {"current_steps": 26590, "total_steps": 40000, "loss": 0.0604, "lr": 0.07579379401985332, "epoch": 1.299220677692815, "percentage": 66.47, "elapsed_time": "1 day, 4:02:56", "remaining_time": "14:08:45", "throughput": 333.53, "total_tokens": 33679200} {"current_steps": 26595, "total_steps": 40000, "loss": 0.0813, "lr": 0.07574260792835905, "epoch": 1.2994649793565094, "percentage": 66.49, "elapsed_time": "1 day, 4:02:59", "remaining_time": "14:08:18", "throughput": 333.58, "total_tokens": 33685120} {"current_steps": 26600, "total_steps": 40000, "loss": 0.0787, "lr": 0.07569143328828784, "epoch": 1.2997092810202038, "percentage": 66.5, "elapsed_time": "1 day, 4:03:02", "remaining_time": "14:07:51", "throughput": 333.63, "total_tokens": 33691232} {"current_steps": 26600, "total_steps": 40000, "eval_loss": 0.06483670324087143, "epoch": 1.2997092810202038, "percentage": 66.5, "elapsed_time": "1 day, 4:13:43", "remaining_time": "14:13:13", "throughput": 331.53, "total_tokens": 33691232} {"current_steps": 26605, "total_steps": 40000, "loss": 0.0793, "lr": 0.0756402701075314, "epoch": 1.2999535826838982, "percentage": 66.51, "elapsed_time": "1 day, 4:13:46", "remaining_time": "14:12:46", "throughput": 331.58, "total_tokens": 33697280} {"current_steps": 26610, "total_steps": 40000, "loss": 0.0855, "lr": 0.07558911839397982, "epoch": 1.3001978843475923, "percentage": 66.53, "elapsed_time": "1 day, 4:13:49", "remaining_time": "14:12:19", "throughput": 331.63, "total_tokens": 33703424} {"current_steps": 26615, "total_steps": 40000, "loss": 0.0421, "lr": 0.07553797815552123, "epoch": 1.3004421860112867, "percentage": 66.54, "elapsed_time": "1 day, 4:13:52", "remaining_time": "14:11:52", "throughput": 331.68, "total_tokens": 33709568} {"current_steps": 26620, "total_steps": 40000, "loss": 0.0517, "lr": 0.07548684940004222, "epoch": 1.300686487674981, "percentage": 66.55, "elapsed_time": "1 day, 4:13:55", "remaining_time": "14:11:25", "throughput": 331.73, "total_tokens": 33715680} {"current_steps": 26625, "total_steps": 40000, "loss": 0.0758, "lr": 0.07543573213542744, "epoch": 1.3009307893386755, "percentage": 66.56, "elapsed_time": "1 day, 4:13:58", "remaining_time": "14:10:58", "throughput": 331.78, "total_tokens": 33721760} {"current_steps": 26630, "total_steps": 40000, "loss": 0.0357, "lr": 0.0753846263695597, "epoch": 1.3011750910023698, "percentage": 66.57, "elapsed_time": "1 day, 4:14:01", "remaining_time": "14:10:30", "throughput": 331.83, "total_tokens": 33728320} {"current_steps": 26635, "total_steps": 40000, "loss": 0.0472, "lr": 0.07533353211032029, "epoch": 1.301419392666064, "percentage": 66.59, "elapsed_time": "1 day, 4:14:05", "remaining_time": "14:10:03", "throughput": 331.89, "total_tokens": 33735008} {"current_steps": 26640, "total_steps": 40000, "loss": 0.058, "lr": 0.07528244936558857, "epoch": 1.3016636943297584, "percentage": 66.6, "elapsed_time": "1 day, 4:14:08", "remaining_time": "14:09:36", "throughput": 331.94, "total_tokens": 33741472} {"current_steps": 26645, "total_steps": 40000, "loss": 0.0517, "lr": 0.07523137814324206, "epoch": 1.3019079959934527, "percentage": 66.61, "elapsed_time": "1 day, 4:14:11", "remaining_time": "14:09:09", "throughput": 331.99, "total_tokens": 33747648} {"current_steps": 26650, "total_steps": 40000, "loss": 0.0594, "lr": 0.07518031845115672, "epoch": 1.302152297657147, "percentage": 66.62, "elapsed_time": "1 day, 4:14:14", "remaining_time": "14:08:42", "throughput": 332.05, "total_tokens": 33754016} {"current_steps": 26655, "total_steps": 40000, "loss": 0.0401, "lr": 0.07512927029720647, "epoch": 1.3023965993208413, "percentage": 66.64, "elapsed_time": "1 day, 4:14:17", "remaining_time": "14:08:15", "throughput": 332.11, "total_tokens": 33761344} {"current_steps": 26660, "total_steps": 40000, "loss": 0.0568, "lr": 0.0750782336892636, "epoch": 1.3026409009845357, "percentage": 66.65, "elapsed_time": "1 day, 4:14:20", "remaining_time": "14:07:48", "throughput": 332.16, "total_tokens": 33767456} {"current_steps": 26665, "total_steps": 40000, "loss": 0.078, "lr": 0.0750272086351987, "epoch": 1.30288520264823, "percentage": 66.66, "elapsed_time": "1 day, 4:14:23", "remaining_time": "14:07:21", "throughput": 332.21, "total_tokens": 33773440} {"current_steps": 26670, "total_steps": 40000, "loss": 0.0879, "lr": 0.07497619514288031, "epoch": 1.3031295043119244, "percentage": 66.67, "elapsed_time": "1 day, 4:14:26", "remaining_time": "14:06:54", "throughput": 332.26, "total_tokens": 33779744} {"current_steps": 26675, "total_steps": 40000, "loss": 0.0616, "lr": 0.07492519322017545, "epoch": 1.3033738059756188, "percentage": 66.69, "elapsed_time": "1 day, 4:14:30", "remaining_time": "14:06:27", "throughput": 332.31, "total_tokens": 33785952} {"current_steps": 26680, "total_steps": 40000, "loss": 0.0467, "lr": 0.0748742028749493, "epoch": 1.303618107639313, "percentage": 66.7, "elapsed_time": "1 day, 4:14:33", "remaining_time": "14:06:00", "throughput": 332.36, "total_tokens": 33792512} {"current_steps": 26685, "total_steps": 40000, "loss": 0.0486, "lr": 0.0748232241150651, "epoch": 1.3038624093030073, "percentage": 66.71, "elapsed_time": "1 day, 4:14:36", "remaining_time": "14:05:33", "throughput": 332.42, "total_tokens": 33799328} {"current_steps": 26690, "total_steps": 40000, "loss": 0.0517, "lr": 0.07477225694838453, "epoch": 1.3041067109667017, "percentage": 66.72, "elapsed_time": "1 day, 4:14:39", "remaining_time": "14:05:06", "throughput": 332.47, "total_tokens": 33805600} {"current_steps": 26695, "total_steps": 40000, "loss": 0.0536, "lr": 0.07472130138276731, "epoch": 1.3043510126303959, "percentage": 66.74, "elapsed_time": "1 day, 4:14:42", "remaining_time": "14:04:39", "throughput": 332.52, "total_tokens": 33811712} {"current_steps": 26700, "total_steps": 40000, "loss": 0.069, "lr": 0.07467035742607138, "epoch": 1.3045953142940903, "percentage": 66.75, "elapsed_time": "1 day, 4:14:45", "remaining_time": "14:04:12", "throughput": 332.58, "total_tokens": 33818304} {"current_steps": 26705, "total_steps": 40000, "loss": 0.1092, "lr": 0.07461942508615303, "epoch": 1.3048396159577846, "percentage": 66.76, "elapsed_time": "1 day, 4:14:48", "remaining_time": "14:03:45", "throughput": 332.63, "total_tokens": 33824480} {"current_steps": 26710, "total_steps": 40000, "loss": 0.0674, "lr": 0.07456850437086657, "epoch": 1.305083917621479, "percentage": 66.77, "elapsed_time": "1 day, 4:14:51", "remaining_time": "14:03:18", "throughput": 332.68, "total_tokens": 33830944} {"current_steps": 26715, "total_steps": 40000, "loss": 0.0602, "lr": 0.07451759528806468, "epoch": 1.3053282192851734, "percentage": 66.79, "elapsed_time": "1 day, 4:14:54", "remaining_time": "14:02:51", "throughput": 332.74, "total_tokens": 33837504} {"current_steps": 26720, "total_steps": 40000, "loss": 0.0643, "lr": 0.0744666978455982, "epoch": 1.3055725209488678, "percentage": 66.8, "elapsed_time": "1 day, 4:14:57", "remaining_time": "14:02:24", "throughput": 332.79, "total_tokens": 33843776} {"current_steps": 26725, "total_steps": 40000, "loss": 0.0693, "lr": 0.07441581205131609, "epoch": 1.305816822612562, "percentage": 66.81, "elapsed_time": "1 day, 4:15:01", "remaining_time": "14:01:57", "throughput": 332.84, "total_tokens": 33850304} {"current_steps": 26730, "total_steps": 40000, "loss": 0.0595, "lr": 0.07436493791306566, "epoch": 1.3060611242762563, "percentage": 66.83, "elapsed_time": "1 day, 4:15:04", "remaining_time": "14:01:30", "throughput": 332.89, "total_tokens": 33856512} {"current_steps": 26735, "total_steps": 40000, "loss": 0.0559, "lr": 0.07431407543869223, "epoch": 1.3063054259399507, "percentage": 66.84, "elapsed_time": "1 day, 4:15:07", "remaining_time": "14:01:03", "throughput": 332.95, "total_tokens": 33862912} {"current_steps": 26740, "total_steps": 40000, "loss": 0.0579, "lr": 0.0742632246360395, "epoch": 1.3065497276036449, "percentage": 66.85, "elapsed_time": "1 day, 4:15:10", "remaining_time": "14:00:36", "throughput": 333.0, "total_tokens": 33869664} {"current_steps": 26745, "total_steps": 40000, "loss": 0.0633, "lr": 0.07421238551294934, "epoch": 1.3067940292673392, "percentage": 66.86, "elapsed_time": "1 day, 4:15:13", "remaining_time": "14:00:09", "throughput": 333.05, "total_tokens": 33875744} {"current_steps": 26750, "total_steps": 40000, "loss": 0.0641, "lr": 0.07416155807726171, "epoch": 1.3070383309310336, "percentage": 66.88, "elapsed_time": "1 day, 4:15:16", "remaining_time": "13:59:42", "throughput": 333.1, "total_tokens": 33882240} {"current_steps": 26755, "total_steps": 40000, "loss": 0.0568, "lr": 0.07411074233681492, "epoch": 1.307282632594728, "percentage": 66.89, "elapsed_time": "1 day, 4:15:19", "remaining_time": "13:59:16", "throughput": 333.15, "total_tokens": 33888256} {"current_steps": 26760, "total_steps": 40000, "loss": 0.0858, "lr": 0.07405993829944528, "epoch": 1.3075269342584224, "percentage": 66.9, "elapsed_time": "1 day, 4:15:22", "remaining_time": "13:58:49", "throughput": 333.2, "total_tokens": 33894240} {"current_steps": 26765, "total_steps": 40000, "loss": 0.0361, "lr": 0.07400914597298755, "epoch": 1.3077712359221167, "percentage": 66.91, "elapsed_time": "1 day, 4:15:25", "remaining_time": "13:58:22", "throughput": 333.25, "total_tokens": 33900160} {"current_steps": 26770, "total_steps": 40000, "loss": 0.0761, "lr": 0.07395836536527445, "epoch": 1.308015537585811, "percentage": 66.92, "elapsed_time": "1 day, 4:15:28", "remaining_time": "13:57:55", "throughput": 333.3, "total_tokens": 33906560} {"current_steps": 26775, "total_steps": 40000, "loss": 0.0758, "lr": 0.07390759648413696, "epoch": 1.3082598392495053, "percentage": 66.94, "elapsed_time": "1 day, 4:15:31", "remaining_time": "13:57:28", "throughput": 333.36, "total_tokens": 33912800} {"current_steps": 26780, "total_steps": 40000, "loss": 0.0466, "lr": 0.07385683933740435, "epoch": 1.3085041409131997, "percentage": 66.95, "elapsed_time": "1 day, 4:15:34", "remaining_time": "13:57:01", "throughput": 333.41, "total_tokens": 33919200} {"current_steps": 26785, "total_steps": 40000, "loss": 0.0554, "lr": 0.07380609393290402, "epoch": 1.3087484425768938, "percentage": 66.96, "elapsed_time": "1 day, 4:15:37", "remaining_time": "13:56:34", "throughput": 333.46, "total_tokens": 33925600} {"current_steps": 26790, "total_steps": 40000, "loss": 0.0453, "lr": 0.07375536027846147, "epoch": 1.3089927442405882, "percentage": 66.97, "elapsed_time": "1 day, 4:15:41", "remaining_time": "13:56:07", "throughput": 333.51, "total_tokens": 33932096} {"current_steps": 26795, "total_steps": 40000, "loss": 0.0848, "lr": 0.07370463838190057, "epoch": 1.3092370459042826, "percentage": 66.99, "elapsed_time": "1 day, 4:15:44", "remaining_time": "13:55:41", "throughput": 333.57, "total_tokens": 33938400} {"current_steps": 26800, "total_steps": 40000, "loss": 0.0274, "lr": 0.07365392825104317, "epoch": 1.309481347567977, "percentage": 67.0, "elapsed_time": "1 day, 4:15:47", "remaining_time": "13:55:14", "throughput": 333.62, "total_tokens": 33944640} {"current_steps": 26800, "total_steps": 40000, "eval_loss": 0.06267567723989487, "epoch": 1.309481347567977, "percentage": 67.0, "elapsed_time": "1 day, 4:26:27", "remaining_time": "14:00:29", "throughput": 331.53, "total_tokens": 33944640} {"current_steps": 26805, "total_steps": 40000, "loss": 0.0795, "lr": 0.07360322989370945, "epoch": 1.3097256492316713, "percentage": 67.01, "elapsed_time": "1 day, 4:26:31", "remaining_time": "14:00:03", "throughput": 331.58, "total_tokens": 33950976} {"current_steps": 26810, "total_steps": 40000, "loss": 0.0491, "lr": 0.07355254331771781, "epoch": 1.3099699508953657, "percentage": 67.03, "elapsed_time": "1 day, 4:26:34", "remaining_time": "13:59:36", "throughput": 331.63, "total_tokens": 33957120} {"current_steps": 26815, "total_steps": 40000, "loss": 0.0491, "lr": 0.07350186853088461, "epoch": 1.3102142525590599, "percentage": 67.04, "elapsed_time": "1 day, 4:26:37", "remaining_time": "13:59:09", "throughput": 331.68, "total_tokens": 33963328} {"current_steps": 26820, "total_steps": 40000, "loss": 0.0687, "lr": 0.07345120554102462, "epoch": 1.3104585542227543, "percentage": 67.05, "elapsed_time": "1 day, 4:26:40", "remaining_time": "13:58:42", "throughput": 331.73, "total_tokens": 33969600} {"current_steps": 26825, "total_steps": 40000, "loss": 0.0469, "lr": 0.07340055435595079, "epoch": 1.3107028558864486, "percentage": 67.06, "elapsed_time": "1 day, 4:26:43", "remaining_time": "13:58:15", "throughput": 331.79, "total_tokens": 33976032} {"current_steps": 26830, "total_steps": 40000, "loss": 0.036, "lr": 0.07334991498347401, "epoch": 1.3109471575501428, "percentage": 67.07, "elapsed_time": "1 day, 4:26:46", "remaining_time": "13:57:48", "throughput": 331.83, "total_tokens": 33982016} {"current_steps": 26835, "total_steps": 40000, "loss": 0.0606, "lr": 0.07329928743140365, "epoch": 1.3111914592138372, "percentage": 67.09, "elapsed_time": "1 day, 4:26:49", "remaining_time": "13:57:21", "throughput": 331.88, "total_tokens": 33988096} {"current_steps": 26840, "total_steps": 40000, "loss": 0.0336, "lr": 0.07324867170754705, "epoch": 1.3114357608775316, "percentage": 67.1, "elapsed_time": "1 day, 4:26:52", "remaining_time": "13:56:54", "throughput": 331.93, "total_tokens": 33993920} {"current_steps": 26845, "total_steps": 40000, "loss": 0.0449, "lr": 0.07319806781970974, "epoch": 1.311680062541226, "percentage": 67.11, "elapsed_time": "1 day, 4:26:55", "remaining_time": "13:56:27", "throughput": 331.98, "total_tokens": 33999616} {"current_steps": 26850, "total_steps": 40000, "loss": 0.0446, "lr": 0.07314747577569555, "epoch": 1.3119243642049203, "percentage": 67.12, "elapsed_time": "1 day, 4:26:58", "remaining_time": "13:56:00", "throughput": 332.03, "total_tokens": 34006272} {"current_steps": 26855, "total_steps": 40000, "loss": 0.0897, "lr": 0.07309689558330636, "epoch": 1.3121686658686147, "percentage": 67.14, "elapsed_time": "1 day, 4:27:01", "remaining_time": "13:55:33", "throughput": 332.08, "total_tokens": 34012256} {"current_steps": 26860, "total_steps": 40000, "loss": 0.0479, "lr": 0.0730463272503423, "epoch": 1.3124129675323088, "percentage": 67.15, "elapsed_time": "1 day, 4:27:05", "remaining_time": "13:55:06", "throughput": 332.14, "total_tokens": 34019584} {"current_steps": 26865, "total_steps": 40000, "loss": 0.0417, "lr": 0.07299577078460168, "epoch": 1.3126572691960032, "percentage": 67.16, "elapsed_time": "1 day, 4:27:07", "remaining_time": "13:54:39", "throughput": 332.19, "total_tokens": 34025216} {"current_steps": 26870, "total_steps": 40000, "loss": 0.0479, "lr": 0.07294522619388083, "epoch": 1.3129015708596976, "percentage": 67.17, "elapsed_time": "1 day, 4:27:11", "remaining_time": "13:54:12", "throughput": 332.24, "total_tokens": 34032000} {"current_steps": 26875, "total_steps": 40000, "loss": 0.0548, "lr": 0.07289469348597452, "epoch": 1.3131458725233918, "percentage": 67.19, "elapsed_time": "1 day, 4:27:14", "remaining_time": "13:53:46", "throughput": 332.3, "total_tokens": 34039104} {"current_steps": 26880, "total_steps": 40000, "loss": 0.049, "lr": 0.07284417266867535, "epoch": 1.3133901741870861, "percentage": 67.2, "elapsed_time": "1 day, 4:27:17", "remaining_time": "13:53:19", "throughput": 332.35, "total_tokens": 34045120} {"current_steps": 26885, "total_steps": 40000, "loss": 0.0641, "lr": 0.07279366374977439, "epoch": 1.3136344758507805, "percentage": 67.21, "elapsed_time": "1 day, 4:27:20", "remaining_time": "13:52:52", "throughput": 332.4, "total_tokens": 34050656} {"current_steps": 26890, "total_steps": 40000, "loss": 0.0514, "lr": 0.07274316673706074, "epoch": 1.313878777514475, "percentage": 67.22, "elapsed_time": "1 day, 4:27:23", "remaining_time": "13:52:25", "throughput": 332.45, "total_tokens": 34057088} {"current_steps": 26895, "total_steps": 40000, "loss": 0.1021, "lr": 0.07269268163832161, "epoch": 1.3141230791781693, "percentage": 67.24, "elapsed_time": "1 day, 4:27:26", "remaining_time": "13:51:58", "throughput": 332.5, "total_tokens": 34062976} {"current_steps": 26900, "total_steps": 40000, "loss": 0.0813, "lr": 0.07264220846134248, "epoch": 1.3143673808418637, "percentage": 67.25, "elapsed_time": "1 day, 4:27:29", "remaining_time": "13:51:31", "throughput": 332.54, "total_tokens": 34068896} {"current_steps": 26905, "total_steps": 40000, "loss": 0.0574, "lr": 0.07259174721390699, "epoch": 1.3146116825055578, "percentage": 67.26, "elapsed_time": "1 day, 4:27:32", "remaining_time": "13:51:04", "throughput": 332.6, "total_tokens": 34075616} {"current_steps": 26910, "total_steps": 40000, "loss": 0.1029, "lr": 0.07254129790379686, "epoch": 1.3148559841692522, "percentage": 67.27, "elapsed_time": "1 day, 4:27:35", "remaining_time": "13:50:38", "throughput": 332.65, "total_tokens": 34081760} {"current_steps": 26915, "total_steps": 40000, "loss": 0.0521, "lr": 0.072490860538792, "epoch": 1.3151002858329466, "percentage": 67.29, "elapsed_time": "1 day, 4:27:38", "remaining_time": "13:50:11", "throughput": 332.7, "total_tokens": 34087840} {"current_steps": 26920, "total_steps": 40000, "loss": 0.0471, "lr": 0.07244043512667042, "epoch": 1.3153445874966407, "percentage": 67.3, "elapsed_time": "1 day, 4:27:41", "remaining_time": "13:49:44", "throughput": 332.75, "total_tokens": 34093760} {"current_steps": 26925, "total_steps": 40000, "loss": 0.0591, "lr": 0.07239002167520843, "epoch": 1.3155888891603351, "percentage": 67.31, "elapsed_time": "1 day, 4:27:44", "remaining_time": "13:49:17", "throughput": 332.8, "total_tokens": 34100288} {"current_steps": 26930, "total_steps": 40000, "loss": 0.037, "lr": 0.07233962019218045, "epoch": 1.3158331908240295, "percentage": 67.33, "elapsed_time": "1 day, 4:27:47", "remaining_time": "13:48:51", "throughput": 332.85, "total_tokens": 34106656} {"current_steps": 26935, "total_steps": 40000, "loss": 0.0704, "lr": 0.07228923068535892, "epoch": 1.3160774924877239, "percentage": 67.34, "elapsed_time": "1 day, 4:27:51", "remaining_time": "13:48:24", "throughput": 332.9, "total_tokens": 34113024} {"current_steps": 26940, "total_steps": 40000, "loss": 0.0392, "lr": 0.0722388531625146, "epoch": 1.3163217941514183, "percentage": 67.35, "elapsed_time": "1 day, 4:27:54", "remaining_time": "13:47:57", "throughput": 332.96, "total_tokens": 34119744} {"current_steps": 26945, "total_steps": 40000, "loss": 0.0552, "lr": 0.07218848763141639, "epoch": 1.3165660958151126, "percentage": 67.36, "elapsed_time": "1 day, 4:27:57", "remaining_time": "13:47:30", "throughput": 333.01, "total_tokens": 34126048} {"current_steps": 26950, "total_steps": 40000, "loss": 0.0667, "lr": 0.07213813409983118, "epoch": 1.3168103974788068, "percentage": 67.38, "elapsed_time": "1 day, 4:28:00", "remaining_time": "13:47:04", "throughput": 333.06, "total_tokens": 34131776} {"current_steps": 26955, "total_steps": 40000, "loss": 0.0448, "lr": 0.0720877925755242, "epoch": 1.3170546991425012, "percentage": 67.39, "elapsed_time": "1 day, 4:28:03", "remaining_time": "13:46:37", "throughput": 333.11, "total_tokens": 34137792} {"current_steps": 26960, "total_steps": 40000, "loss": 0.0573, "lr": 0.07203746306625866, "epoch": 1.3172990008061956, "percentage": 67.4, "elapsed_time": "1 day, 4:28:06", "remaining_time": "13:46:10", "throughput": 333.15, "total_tokens": 34143744} {"current_steps": 26965, "total_steps": 40000, "loss": 0.089, "lr": 0.07198714557979606, "epoch": 1.3175433024698897, "percentage": 67.41, "elapsed_time": "1 day, 4:28:09", "remaining_time": "13:45:43", "throughput": 333.21, "total_tokens": 34149984} {"current_steps": 26970, "total_steps": 40000, "loss": 0.0714, "lr": 0.07193684012389602, "epoch": 1.317787604133584, "percentage": 67.42, "elapsed_time": "1 day, 4:28:12", "remaining_time": "13:45:17", "throughput": 333.26, "total_tokens": 34156352} {"current_steps": 26975, "total_steps": 40000, "loss": 0.0757, "lr": 0.07188654670631621, "epoch": 1.3180319057972785, "percentage": 67.44, "elapsed_time": "1 day, 4:28:15", "remaining_time": "13:44:50", "throughput": 333.31, "total_tokens": 34162432} {"current_steps": 26980, "total_steps": 40000, "loss": 0.0634, "lr": 0.07183626533481258, "epoch": 1.3182762074609728, "percentage": 67.45, "elapsed_time": "1 day, 4:28:18", "remaining_time": "13:44:23", "throughput": 333.35, "total_tokens": 34168256} {"current_steps": 26985, "total_steps": 40000, "loss": 0.0528, "lr": 0.07178599601713909, "epoch": 1.3185205091246672, "percentage": 67.46, "elapsed_time": "1 day, 4:28:21", "remaining_time": "13:43:56", "throughput": 333.41, "total_tokens": 34174592} {"current_steps": 26990, "total_steps": 40000, "loss": 0.0938, "lr": 0.07173573876104786, "epoch": 1.3187648107883614, "percentage": 67.47, "elapsed_time": "1 day, 4:28:24", "remaining_time": "13:43:30", "throughput": 333.46, "total_tokens": 34181152} {"current_steps": 26995, "total_steps": 40000, "loss": 0.0422, "lr": 0.0716854935742893, "epoch": 1.3190091124520558, "percentage": 67.49, "elapsed_time": "1 day, 4:28:27", "remaining_time": "13:43:03", "throughput": 333.51, "total_tokens": 34187104} {"current_steps": 27000, "total_steps": 40000, "loss": 0.0781, "lr": 0.07163526046461174, "epoch": 1.3192534141157501, "percentage": 67.5, "elapsed_time": "1 day, 4:28:30", "remaining_time": "13:42:37", "throughput": 333.56, "total_tokens": 34193536} {"current_steps": 27000, "total_steps": 40000, "eval_loss": 0.06449524313211441, "epoch": 1.3192534141157501, "percentage": 67.5, "elapsed_time": "1 day, 4:39:10", "remaining_time": "13:47:45", "throughput": 331.49, "total_tokens": 34193536} {"current_steps": 27005, "total_steps": 40000, "loss": 0.0585, "lr": 0.07158503943976181, "epoch": 1.3194977157794445, "percentage": 67.51, "elapsed_time": "1 day, 4:39:14", "remaining_time": "13:47:18", "throughput": 331.54, "total_tokens": 34199392} {"current_steps": 27010, "total_steps": 40000, "loss": 0.0678, "lr": 0.07153483050748427, "epoch": 1.3197420174431387, "percentage": 67.53, "elapsed_time": "1 day, 4:39:17", "remaining_time": "13:46:51", "throughput": 331.59, "total_tokens": 34205792} {"current_steps": 27015, "total_steps": 40000, "loss": 0.0585, "lr": 0.07148463367552188, "epoch": 1.319986319106833, "percentage": 67.54, "elapsed_time": "1 day, 4:39:20", "remaining_time": "13:46:25", "throughput": 331.64, "total_tokens": 34212288} {"current_steps": 27020, "total_steps": 40000, "loss": 0.0385, "lr": 0.07143444895161565, "epoch": 1.3202306207705274, "percentage": 67.55, "elapsed_time": "1 day, 4:39:23", "remaining_time": "13:45:58", "throughput": 331.69, "total_tokens": 34218592} {"current_steps": 27025, "total_steps": 40000, "loss": 0.0644, "lr": 0.07138427634350476, "epoch": 1.3204749224342218, "percentage": 67.56, "elapsed_time": "1 day, 4:39:26", "remaining_time": "13:45:31", "throughput": 331.74, "total_tokens": 34225056} {"current_steps": 27030, "total_steps": 40000, "loss": 0.0541, "lr": 0.07133411585892636, "epoch": 1.3207192240979162, "percentage": 67.58, "elapsed_time": "1 day, 4:39:30", "remaining_time": "13:45:04", "throughput": 331.8, "total_tokens": 34231584} {"current_steps": 27035, "total_steps": 40000, "loss": 0.0602, "lr": 0.07128396750561593, "epoch": 1.3209635257616104, "percentage": 67.59, "elapsed_time": "1 day, 4:39:33", "remaining_time": "13:44:38", "throughput": 331.85, "total_tokens": 34237952} {"current_steps": 27040, "total_steps": 40000, "loss": 0.0681, "lr": 0.07123383129130685, "epoch": 1.3212078274253047, "percentage": 67.6, "elapsed_time": "1 day, 4:39:36", "remaining_time": "13:44:11", "throughput": 331.9, "total_tokens": 34244416} {"current_steps": 27045, "total_steps": 40000, "loss": 0.0362, "lr": 0.07118370722373084, "epoch": 1.3214521290889991, "percentage": 67.61, "elapsed_time": "1 day, 4:39:39", "remaining_time": "13:43:44", "throughput": 331.96, "total_tokens": 34250976} {"current_steps": 27050, "total_steps": 40000, "loss": 0.0357, "lr": 0.07113359531061769, "epoch": 1.3216964307526935, "percentage": 67.62, "elapsed_time": "1 day, 4:39:42", "remaining_time": "13:43:18", "throughput": 332.01, "total_tokens": 34258016} {"current_steps": 27055, "total_steps": 40000, "loss": 0.0497, "lr": 0.07108349555969525, "epoch": 1.3219407324163877, "percentage": 67.64, "elapsed_time": "1 day, 4:39:45", "remaining_time": "13:42:51", "throughput": 332.06, "total_tokens": 34264256} {"current_steps": 27060, "total_steps": 40000, "loss": 0.0541, "lr": 0.07103340797868944, "epoch": 1.322185034080082, "percentage": 67.65, "elapsed_time": "1 day, 4:39:48", "remaining_time": "13:42:24", "throughput": 332.11, "total_tokens": 34270304} {"current_steps": 27065, "total_steps": 40000, "loss": 0.0832, "lr": 0.07098333257532453, "epoch": 1.3224293357437764, "percentage": 67.66, "elapsed_time": "1 day, 4:39:51", "remaining_time": "13:41:57", "throughput": 332.16, "total_tokens": 34276672} {"current_steps": 27070, "total_steps": 40000, "loss": 0.069, "lr": 0.07093326935732269, "epoch": 1.3226736374074708, "percentage": 67.67, "elapsed_time": "1 day, 4:39:54", "remaining_time": "13:41:31", "throughput": 332.21, "total_tokens": 34282496} {"current_steps": 27075, "total_steps": 40000, "loss": 0.0625, "lr": 0.0708832183324044, "epoch": 1.3229179390711652, "percentage": 67.69, "elapsed_time": "1 day, 4:39:57", "remaining_time": "13:41:04", "throughput": 332.26, "total_tokens": 34288800} {"current_steps": 27080, "total_steps": 40000, "loss": 0.0553, "lr": 0.07083317950828799, "epoch": 1.3231622407348593, "percentage": 67.7, "elapsed_time": "1 day, 4:40:01", "remaining_time": "13:40:37", "throughput": 332.31, "total_tokens": 34295232} {"current_steps": 27085, "total_steps": 40000, "loss": 0.0924, "lr": 0.0707831528926902, "epoch": 1.3234065423985537, "percentage": 67.71, "elapsed_time": "1 day, 4:40:04", "remaining_time": "13:40:11", "throughput": 332.36, "total_tokens": 34301120} {"current_steps": 27090, "total_steps": 40000, "loss": 0.0463, "lr": 0.07073313849332578, "epoch": 1.323650844062248, "percentage": 67.73, "elapsed_time": "1 day, 4:40:07", "remaining_time": "13:39:44", "throughput": 332.41, "total_tokens": 34307328} {"current_steps": 27095, "total_steps": 40000, "loss": 0.0556, "lr": 0.07068313631790749, "epoch": 1.3238951457259425, "percentage": 67.74, "elapsed_time": "1 day, 4:40:10", "remaining_time": "13:39:17", "throughput": 332.47, "total_tokens": 34314432} {"current_steps": 27100, "total_steps": 40000, "loss": 0.0933, "lr": 0.07063314637414632, "epoch": 1.3241394473896366, "percentage": 67.75, "elapsed_time": "1 day, 4:40:13", "remaining_time": "13:38:51", "throughput": 332.52, "total_tokens": 34320608} {"current_steps": 27105, "total_steps": 40000, "loss": 0.0568, "lr": 0.07058316866975144, "epoch": 1.324383749053331, "percentage": 67.76, "elapsed_time": "1 day, 4:40:16", "remaining_time": "13:38:24", "throughput": 332.57, "total_tokens": 34326912} {"current_steps": 27110, "total_steps": 40000, "loss": 0.0384, "lr": 0.0705332032124299, "epoch": 1.3246280507170254, "percentage": 67.77, "elapsed_time": "1 day, 4:40:19", "remaining_time": "13:37:57", "throughput": 332.62, "total_tokens": 34332960} {"current_steps": 27115, "total_steps": 40000, "loss": 0.0488, "lr": 0.0704832500098871, "epoch": 1.3248723523807198, "percentage": 67.79, "elapsed_time": "1 day, 4:40:22", "remaining_time": "13:37:31", "throughput": 332.67, "total_tokens": 34339392} {"current_steps": 27120, "total_steps": 40000, "loss": 0.0558, "lr": 0.07043330906982641, "epoch": 1.3251166540444141, "percentage": 67.8, "elapsed_time": "1 day, 4:40:25", "remaining_time": "13:37:04", "throughput": 332.72, "total_tokens": 34345184} {"current_steps": 27125, "total_steps": 40000, "loss": 0.0758, "lr": 0.07038338039994936, "epoch": 1.3253609557081083, "percentage": 67.81, "elapsed_time": "1 day, 4:40:28", "remaining_time": "13:36:38", "throughput": 332.77, "total_tokens": 34351520} {"current_steps": 27130, "total_steps": 40000, "loss": 0.0338, "lr": 0.07033346400795562, "epoch": 1.3256052573718027, "percentage": 67.83, "elapsed_time": "1 day, 4:40:32", "remaining_time": "13:36:11", "throughput": 332.83, "total_tokens": 34358528} {"current_steps": 27135, "total_steps": 40000, "loss": 0.0659, "lr": 0.07028355990154282, "epoch": 1.325849559035497, "percentage": 67.84, "elapsed_time": "1 day, 4:40:35", "remaining_time": "13:35:44", "throughput": 332.87, "total_tokens": 34364320} {"current_steps": 27140, "total_steps": 40000, "loss": 0.0573, "lr": 0.07023366808840685, "epoch": 1.3260938606991914, "percentage": 67.85, "elapsed_time": "1 day, 4:40:38", "remaining_time": "13:35:18", "throughput": 332.93, "total_tokens": 34370624} {"current_steps": 27145, "total_steps": 40000, "loss": 0.0373, "lr": 0.07018378857624172, "epoch": 1.3263381623628856, "percentage": 67.86, "elapsed_time": "1 day, 4:40:41", "remaining_time": "13:34:51", "throughput": 332.98, "total_tokens": 34376832} {"current_steps": 27150, "total_steps": 40000, "loss": 0.0297, "lr": 0.0701339213727394, "epoch": 1.32658246402658, "percentage": 67.88, "elapsed_time": "1 day, 4:40:44", "remaining_time": "13:34:25", "throughput": 333.02, "total_tokens": 34382688} {"current_steps": 27155, "total_steps": 40000, "loss": 0.0483, "lr": 0.07008406648559008, "epoch": 1.3268267656902744, "percentage": 67.89, "elapsed_time": "1 day, 4:40:47", "remaining_time": "13:33:58", "throughput": 333.07, "total_tokens": 34388896} {"current_steps": 27160, "total_steps": 40000, "loss": 0.0576, "lr": 0.07003422392248196, "epoch": 1.3270710673539687, "percentage": 67.9, "elapsed_time": "1 day, 4:40:50", "remaining_time": "13:33:31", "throughput": 333.12, "total_tokens": 34394912} {"current_steps": 27165, "total_steps": 40000, "loss": 0.0592, "lr": 0.06998439369110142, "epoch": 1.3273153690176631, "percentage": 67.91, "elapsed_time": "1 day, 4:40:53", "remaining_time": "13:33:05", "throughput": 333.18, "total_tokens": 34401792} {"current_steps": 27170, "total_steps": 40000, "loss": 0.0575, "lr": 0.06993457579913295, "epoch": 1.3275596706813573, "percentage": 67.92, "elapsed_time": "1 day, 4:40:56", "remaining_time": "13:32:38", "throughput": 333.23, "total_tokens": 34408064} {"current_steps": 27175, "total_steps": 40000, "loss": 0.0404, "lr": 0.06988477025425903, "epoch": 1.3278039723450517, "percentage": 67.94, "elapsed_time": "1 day, 4:40:59", "remaining_time": "13:32:12", "throughput": 333.28, "total_tokens": 34414528} {"current_steps": 27180, "total_steps": 40000, "loss": 0.0342, "lr": 0.06983497706416032, "epoch": 1.328048274008746, "percentage": 67.95, "elapsed_time": "1 day, 4:41:02", "remaining_time": "13:31:45", "throughput": 333.33, "total_tokens": 34420896} {"current_steps": 27185, "total_steps": 40000, "loss": 0.0435, "lr": 0.0697851962365156, "epoch": 1.3282925756724404, "percentage": 67.96, "elapsed_time": "1 day, 4:41:05", "remaining_time": "13:31:19", "throughput": 333.38, "total_tokens": 34426976} {"current_steps": 27190, "total_steps": 40000, "loss": 0.0594, "lr": 0.06973542777900163, "epoch": 1.3285368773361346, "percentage": 67.97, "elapsed_time": "1 day, 4:41:08", "remaining_time": "13:30:52", "throughput": 333.43, "total_tokens": 34433440} {"current_steps": 27195, "total_steps": 40000, "loss": 0.0535, "lr": 0.06968567169929342, "epoch": 1.328781178999829, "percentage": 67.99, "elapsed_time": "1 day, 4:41:12", "remaining_time": "13:30:26", "throughput": 333.49, "total_tokens": 34439936} {"current_steps": 27200, "total_steps": 40000, "loss": 0.0356, "lr": 0.06963592800506392, "epoch": 1.3290254806635233, "percentage": 68.0, "elapsed_time": "1 day, 4:41:15", "remaining_time": "13:30:00", "throughput": 333.54, "total_tokens": 34445952} {"current_steps": 27200, "total_steps": 40000, "eval_loss": 0.06495053321123123, "epoch": 1.3290254806635233, "percentage": 68.0, "elapsed_time": "1 day, 4:51:55", "remaining_time": "13:35:01", "throughput": 331.48, "total_tokens": 34445952} {"current_steps": 27205, "total_steps": 40000, "loss": 0.0756, "lr": 0.06958619670398417, "epoch": 1.3292697823272177, "percentage": 68.01, "elapsed_time": "1 day, 4:51:59", "remaining_time": "13:34:35", "throughput": 331.53, "total_tokens": 34451968} {"current_steps": 27210, "total_steps": 40000, "loss": 0.0495, "lr": 0.0695364778037235, "epoch": 1.329514083990912, "percentage": 68.03, "elapsed_time": "1 day, 4:52:02", "remaining_time": "13:34:08", "throughput": 331.58, "total_tokens": 34458272} {"current_steps": 27215, "total_steps": 40000, "loss": 0.0995, "lr": 0.06948677131194907, "epoch": 1.3297583856546062, "percentage": 68.04, "elapsed_time": "1 day, 4:52:05", "remaining_time": "13:33:42", "throughput": 331.63, "total_tokens": 34465120} {"current_steps": 27220, "total_steps": 40000, "loss": 0.0783, "lr": 0.06943707723632629, "epoch": 1.3300026873183006, "percentage": 68.05, "elapsed_time": "1 day, 4:52:09", "remaining_time": "13:33:15", "throughput": 331.68, "total_tokens": 34471584} {"current_steps": 27225, "total_steps": 40000, "loss": 0.0868, "lr": 0.06938739558451867, "epoch": 1.330246988981995, "percentage": 68.06, "elapsed_time": "1 day, 4:52:12", "remaining_time": "13:32:48", "throughput": 331.73, "total_tokens": 34477696} {"current_steps": 27230, "total_steps": 40000, "loss": 0.0679, "lr": 0.06933772636418763, "epoch": 1.3304912906456892, "percentage": 68.08, "elapsed_time": "1 day, 4:52:15", "remaining_time": "13:32:22", "throughput": 331.78, "total_tokens": 34483808} {"current_steps": 27235, "total_steps": 40000, "loss": 0.0665, "lr": 0.06928806958299293, "epoch": 1.3307355923093835, "percentage": 68.09, "elapsed_time": "1 day, 4:52:18", "remaining_time": "13:31:55", "throughput": 331.83, "total_tokens": 34489568} {"current_steps": 27240, "total_steps": 40000, "loss": 0.055, "lr": 0.06923842524859211, "epoch": 1.330979893973078, "percentage": 68.1, "elapsed_time": "1 day, 4:52:21", "remaining_time": "13:31:29", "throughput": 331.88, "total_tokens": 34495488} {"current_steps": 27245, "total_steps": 40000, "loss": 0.057, "lr": 0.06918879336864105, "epoch": 1.3312241956367723, "percentage": 68.11, "elapsed_time": "1 day, 4:52:24", "remaining_time": "13:31:02", "throughput": 331.92, "total_tokens": 34501056} {"current_steps": 27250, "total_steps": 40000, "loss": 0.0865, "lr": 0.06913917395079362, "epoch": 1.3314684973004667, "percentage": 68.12, "elapsed_time": "1 day, 4:52:27", "remaining_time": "13:30:35", "throughput": 331.97, "total_tokens": 34507456} {"current_steps": 27255, "total_steps": 40000, "loss": 0.0656, "lr": 0.0690895670027017, "epoch": 1.331712798964161, "percentage": 68.14, "elapsed_time": "1 day, 4:52:30", "remaining_time": "13:30:09", "throughput": 332.02, "total_tokens": 34513696} {"current_steps": 27260, "total_steps": 40000, "loss": 0.0462, "lr": 0.06903997253201531, "epoch": 1.3319571006278552, "percentage": 68.15, "elapsed_time": "1 day, 4:52:33", "remaining_time": "13:29:42", "throughput": 332.07, "total_tokens": 34520128} {"current_steps": 27265, "total_steps": 40000, "loss": 0.0537, "lr": 0.06899039054638263, "epoch": 1.3322014022915496, "percentage": 68.16, "elapsed_time": "1 day, 4:52:36", "remaining_time": "13:29:16", "throughput": 332.12, "total_tokens": 34526400} {"current_steps": 27270, "total_steps": 40000, "loss": 0.0558, "lr": 0.06894082105344976, "epoch": 1.332445703955244, "percentage": 68.17, "elapsed_time": "1 day, 4:52:39", "remaining_time": "13:28:49", "throughput": 332.17, "total_tokens": 34532608} {"current_steps": 27275, "total_steps": 40000, "loss": 0.0605, "lr": 0.06889126406086087, "epoch": 1.3326900056189381, "percentage": 68.19, "elapsed_time": "1 day, 4:52:42", "remaining_time": "13:28:23", "throughput": 332.22, "total_tokens": 34538944} {"current_steps": 27280, "total_steps": 40000, "loss": 0.0471, "lr": 0.0688417195762584, "epoch": 1.3329343072826325, "percentage": 68.2, "elapsed_time": "1 day, 4:52:45", "remaining_time": "13:27:56", "throughput": 332.28, "total_tokens": 34545440} {"current_steps": 27285, "total_steps": 40000, "loss": 0.0448, "lr": 0.06879218760728262, "epoch": 1.333178608946327, "percentage": 68.21, "elapsed_time": "1 day, 4:52:48", "remaining_time": "13:27:30", "throughput": 332.33, "total_tokens": 34551840} {"current_steps": 27290, "total_steps": 40000, "loss": 0.0412, "lr": 0.06874266816157207, "epoch": 1.3334229106100213, "percentage": 68.23, "elapsed_time": "1 day, 4:52:51", "remaining_time": "13:27:03", "throughput": 332.38, "total_tokens": 34558048} {"current_steps": 27295, "total_steps": 40000, "loss": 0.073, "lr": 0.06869316124676321, "epoch": 1.3336672122737157, "percentage": 68.24, "elapsed_time": "1 day, 4:52:54", "remaining_time": "13:26:37", "throughput": 332.43, "total_tokens": 34564160} {"current_steps": 27300, "total_steps": 40000, "loss": 0.0278, "lr": 0.06864366687049062, "epoch": 1.33391151393741, "percentage": 68.25, "elapsed_time": "1 day, 4:52:58", "remaining_time": "13:26:10", "throughput": 332.48, "total_tokens": 34570720} {"current_steps": 27305, "total_steps": 40000, "loss": 0.0433, "lr": 0.06859418504038704, "epoch": 1.3341558156011042, "percentage": 68.26, "elapsed_time": "1 day, 4:53:01", "remaining_time": "13:25:44", "throughput": 332.54, "total_tokens": 34577632} {"current_steps": 27310, "total_steps": 40000, "loss": 0.0708, "lr": 0.06854471576408311, "epoch": 1.3344001172647986, "percentage": 68.27, "elapsed_time": "1 day, 4:53:04", "remaining_time": "13:25:17", "throughput": 332.59, "total_tokens": 34584160} {"current_steps": 27315, "total_steps": 40000, "loss": 0.0746, "lr": 0.06849525904920767, "epoch": 1.334644418928493, "percentage": 68.29, "elapsed_time": "1 day, 4:53:07", "remaining_time": "13:24:51", "throughput": 332.64, "total_tokens": 34590464} {"current_steps": 27320, "total_steps": 40000, "loss": 0.0469, "lr": 0.06844581490338748, "epoch": 1.334888720592187, "percentage": 68.3, "elapsed_time": "1 day, 4:53:10", "remaining_time": "13:24:25", "throughput": 332.69, "total_tokens": 34596800} {"current_steps": 27325, "total_steps": 40000, "loss": 0.0413, "lr": 0.06839638333424752, "epoch": 1.3351330222558815, "percentage": 68.31, "elapsed_time": "1 day, 4:53:13", "remaining_time": "13:23:58", "throughput": 332.74, "total_tokens": 34603360} {"current_steps": 27330, "total_steps": 40000, "loss": 0.063, "lr": 0.06834696434941082, "epoch": 1.3353773239195759, "percentage": 68.33, "elapsed_time": "1 day, 4:53:16", "remaining_time": "13:23:32", "throughput": 332.8, "total_tokens": 34609664} {"current_steps": 27335, "total_steps": 40000, "loss": 0.05, "lr": 0.06829755795649824, "epoch": 1.3356216255832702, "percentage": 68.34, "elapsed_time": "1 day, 4:53:20", "remaining_time": "13:23:05", "throughput": 332.85, "total_tokens": 34616320} {"current_steps": 27340, "total_steps": 40000, "loss": 0.0623, "lr": 0.06824816416312904, "epoch": 1.3358659272469646, "percentage": 68.35, "elapsed_time": "1 day, 4:53:23", "remaining_time": "13:22:39", "throughput": 332.9, "total_tokens": 34622336} {"current_steps": 27345, "total_steps": 40000, "loss": 0.0739, "lr": 0.06819878297692027, "epoch": 1.336110228910659, "percentage": 68.36, "elapsed_time": "1 day, 4:53:26", "remaining_time": "13:22:13", "throughput": 332.95, "total_tokens": 34628896} {"current_steps": 27350, "total_steps": 40000, "loss": 0.0669, "lr": 0.0681494144054871, "epoch": 1.3363545305743532, "percentage": 68.38, "elapsed_time": "1 day, 4:53:29", "remaining_time": "13:21:46", "throughput": 333.0, "total_tokens": 34635264} {"current_steps": 27355, "total_steps": 40000, "loss": 0.057, "lr": 0.06810005845644286, "epoch": 1.3365988322380475, "percentage": 68.39, "elapsed_time": "1 day, 4:53:32", "remaining_time": "13:21:20", "throughput": 333.05, "total_tokens": 34641536} {"current_steps": 27360, "total_steps": 40000, "loss": 0.0329, "lr": 0.06805071513739878, "epoch": 1.336843133901742, "percentage": 68.4, "elapsed_time": "1 day, 4:53:35", "remaining_time": "13:20:53", "throughput": 333.11, "total_tokens": 34648192} {"current_steps": 27365, "total_steps": 40000, "loss": 0.0427, "lr": 0.06800138445596428, "epoch": 1.337087435565436, "percentage": 68.41, "elapsed_time": "1 day, 4:53:38", "remaining_time": "13:20:27", "throughput": 333.16, "total_tokens": 34654304} {"current_steps": 27370, "total_steps": 40000, "loss": 0.0707, "lr": 0.06795206641974678, "epoch": 1.3373317372291305, "percentage": 68.42, "elapsed_time": "1 day, 4:53:41", "remaining_time": "13:20:01", "throughput": 333.2, "total_tokens": 34660288} {"current_steps": 27375, "total_steps": 40000, "loss": 0.0635, "lr": 0.06790276103635169, "epoch": 1.3375760388928248, "percentage": 68.44, "elapsed_time": "1 day, 4:53:44", "remaining_time": "13:19:34", "throughput": 333.26, "total_tokens": 34666880} {"current_steps": 27380, "total_steps": 40000, "loss": 0.0353, "lr": 0.0678534683133826, "epoch": 1.3378203405565192, "percentage": 68.45, "elapsed_time": "1 day, 4:53:47", "remaining_time": "13:19:08", "throughput": 333.31, "total_tokens": 34673152} {"current_steps": 27385, "total_steps": 40000, "loss": 0.0452, "lr": 0.06780418825844095, "epoch": 1.3380646422202136, "percentage": 68.46, "elapsed_time": "1 day, 4:53:50", "remaining_time": "13:18:42", "throughput": 333.36, "total_tokens": 34679904} {"current_steps": 27390, "total_steps": 40000, "loss": 0.0348, "lr": 0.0677549208791264, "epoch": 1.338308943883908, "percentage": 68.47, "elapsed_time": "1 day, 4:53:54", "remaining_time": "13:18:15", "throughput": 333.42, "total_tokens": 34686528} {"current_steps": 27395, "total_steps": 40000, "loss": 0.041, "lr": 0.06770566618303668, "epoch": 1.3385532455476021, "percentage": 68.49, "elapsed_time": "1 day, 4:53:57", "remaining_time": "13:17:49", "throughput": 333.47, "total_tokens": 34692800} {"current_steps": 27400, "total_steps": 40000, "loss": 0.044, "lr": 0.06765642417776736, "epoch": 1.3387975472112965, "percentage": 68.5, "elapsed_time": "1 day, 4:54:00", "remaining_time": "13:17:23", "throughput": 333.51, "total_tokens": 34698784} {"current_steps": 27400, "total_steps": 40000, "eval_loss": 0.06539439409971237, "epoch": 1.3387975472112965, "percentage": 68.5, "elapsed_time": "1 day, 5:04:40", "remaining_time": "13:22:17", "throughput": 331.47, "total_tokens": 34698784} {"current_steps": 27405, "total_steps": 40000, "loss": 0.0704, "lr": 0.0676071948709122, "epoch": 1.339041848874991, "percentage": 68.51, "elapsed_time": "1 day, 5:04:44", "remaining_time": "13:21:51", "throughput": 331.52, "total_tokens": 34705152} {"current_steps": 27410, "total_steps": 40000, "loss": 0.0469, "lr": 0.06755797827006307, "epoch": 1.339286150538685, "percentage": 68.53, "elapsed_time": "1 day, 5:04:47", "remaining_time": "13:21:25", "throughput": 331.57, "total_tokens": 34711488} {"current_steps": 27415, "total_steps": 40000, "loss": 0.046, "lr": 0.06750877438280974, "epoch": 1.3395304522023794, "percentage": 68.54, "elapsed_time": "1 day, 5:04:50", "remaining_time": "13:20:58", "throughput": 331.62, "total_tokens": 34717568} {"current_steps": 27420, "total_steps": 40000, "loss": 0.0477, "lr": 0.06745958321673998, "epoch": 1.3397747538660738, "percentage": 68.55, "elapsed_time": "1 day, 5:04:53", "remaining_time": "13:20:32", "throughput": 331.67, "total_tokens": 34723584} {"current_steps": 27425, "total_steps": 40000, "loss": 0.0494, "lr": 0.0674104047794398, "epoch": 1.3400190555297682, "percentage": 68.56, "elapsed_time": "1 day, 5:04:56", "remaining_time": "13:20:05", "throughput": 331.72, "total_tokens": 34729728} {"current_steps": 27430, "total_steps": 40000, "loss": 0.0463, "lr": 0.06736123907849303, "epoch": 1.3402633571934626, "percentage": 68.58, "elapsed_time": "1 day, 5:04:59", "remaining_time": "13:19:39", "throughput": 331.77, "total_tokens": 34735712} {"current_steps": 27435, "total_steps": 40000, "loss": 0.0445, "lr": 0.06731208612148178, "epoch": 1.340507658857157, "percentage": 68.59, "elapsed_time": "1 day, 5:05:02", "remaining_time": "13:19:12", "throughput": 331.82, "total_tokens": 34742112} {"current_steps": 27440, "total_steps": 40000, "loss": 0.063, "lr": 0.0672629459159859, "epoch": 1.340751960520851, "percentage": 68.6, "elapsed_time": "1 day, 5:05:05", "remaining_time": "13:18:46", "throughput": 331.87, "total_tokens": 34748160} {"current_steps": 27445, "total_steps": 40000, "loss": 0.0439, "lr": 0.0672138184695835, "epoch": 1.3409962621845455, "percentage": 68.61, "elapsed_time": "1 day, 5:05:08", "remaining_time": "13:18:20", "throughput": 331.92, "total_tokens": 34754720} {"current_steps": 27450, "total_steps": 40000, "loss": 0.0226, "lr": 0.0671647037898507, "epoch": 1.3412405638482399, "percentage": 68.62, "elapsed_time": "1 day, 5:05:11", "remaining_time": "13:17:53", "throughput": 331.98, "total_tokens": 34761696} {"current_steps": 27455, "total_steps": 40000, "loss": 0.0839, "lr": 0.0671156018843615, "epoch": 1.341484865511934, "percentage": 68.64, "elapsed_time": "1 day, 5:05:14", "remaining_time": "13:17:27", "throughput": 332.03, "total_tokens": 34767968} {"current_steps": 27460, "total_steps": 40000, "loss": 0.0775, "lr": 0.06706651276068812, "epoch": 1.3417291671756284, "percentage": 68.65, "elapsed_time": "1 day, 5:05:17", "remaining_time": "13:17:00", "throughput": 332.07, "total_tokens": 34774080} {"current_steps": 27465, "total_steps": 40000, "loss": 0.0531, "lr": 0.06701743642640064, "epoch": 1.3419734688393228, "percentage": 68.66, "elapsed_time": "1 day, 5:05:20", "remaining_time": "13:16:34", "throughput": 332.12, "total_tokens": 34779904} {"current_steps": 27470, "total_steps": 40000, "loss": 0.0662, "lr": 0.06696837288906729, "epoch": 1.3422177705030172, "percentage": 68.67, "elapsed_time": "1 day, 5:05:24", "remaining_time": "13:16:08", "throughput": 332.17, "total_tokens": 34786592} {"current_steps": 27475, "total_steps": 40000, "loss": 0.0496, "lr": 0.06691932215625432, "epoch": 1.3424620721667115, "percentage": 68.69, "elapsed_time": "1 day, 5:05:27", "remaining_time": "13:15:41", "throughput": 332.22, "total_tokens": 34792544} {"current_steps": 27480, "total_steps": 40000, "loss": 0.0548, "lr": 0.06687028423552589, "epoch": 1.342706373830406, "percentage": 68.7, "elapsed_time": "1 day, 5:05:30", "remaining_time": "13:15:15", "throughput": 332.27, "total_tokens": 34799008} {"current_steps": 27485, "total_steps": 40000, "loss": 0.0848, "lr": 0.06682125913444435, "epoch": 1.3429506754941, "percentage": 68.71, "elapsed_time": "1 day, 5:05:33", "remaining_time": "13:14:49", "throughput": 332.32, "total_tokens": 34805376} {"current_steps": 27490, "total_steps": 40000, "loss": 0.0527, "lr": 0.0667722468605699, "epoch": 1.3431949771577945, "percentage": 68.73, "elapsed_time": "1 day, 5:05:36", "remaining_time": "13:14:22", "throughput": 332.38, "total_tokens": 34812128} {"current_steps": 27495, "total_steps": 40000, "loss": 0.0561, "lr": 0.06672324742146094, "epoch": 1.3434392788214888, "percentage": 68.74, "elapsed_time": "1 day, 5:05:39", "remaining_time": "13:13:56", "throughput": 332.43, "total_tokens": 34818528} {"current_steps": 27500, "total_steps": 40000, "loss": 0.0642, "lr": 0.06667426082467373, "epoch": 1.343683580485183, "percentage": 68.75, "elapsed_time": "1 day, 5:05:42", "remaining_time": "13:13:30", "throughput": 332.48, "total_tokens": 34824448} {"current_steps": 27505, "total_steps": 40000, "loss": 0.0525, "lr": 0.0666252870777626, "epoch": 1.3439278821488774, "percentage": 68.76, "elapsed_time": "1 day, 5:05:45", "remaining_time": "13:13:04", "throughput": 332.54, "total_tokens": 34831680} {"current_steps": 27510, "total_steps": 40000, "loss": 0.0675, "lr": 0.06657632618827995, "epoch": 1.3441721838125718, "percentage": 68.77, "elapsed_time": "1 day, 5:05:48", "remaining_time": "13:12:37", "throughput": 332.58, "total_tokens": 34837728} {"current_steps": 27515, "total_steps": 40000, "loss": 0.0544, "lr": 0.06652737816377623, "epoch": 1.3444164854762661, "percentage": 68.79, "elapsed_time": "1 day, 5:05:51", "remaining_time": "13:12:11", "throughput": 332.63, "total_tokens": 34844160} {"current_steps": 27520, "total_steps": 40000, "loss": 0.0747, "lr": 0.06647844301179971, "epoch": 1.3446607871399605, "percentage": 68.8, "elapsed_time": "1 day, 5:05:55", "remaining_time": "13:11:45", "throughput": 332.68, "total_tokens": 34850048} {"current_steps": 27525, "total_steps": 40000, "loss": 0.0569, "lr": 0.06642952073989689, "epoch": 1.344905088803655, "percentage": 68.81, "elapsed_time": "1 day, 5:05:58", "remaining_time": "13:11:18", "throughput": 332.73, "total_tokens": 34856352} {"current_steps": 27530, "total_steps": 40000, "loss": 0.0712, "lr": 0.06638061135561223, "epoch": 1.345149390467349, "percentage": 68.83, "elapsed_time": "1 day, 5:06:01", "remaining_time": "13:10:52", "throughput": 332.78, "total_tokens": 34862304} {"current_steps": 27535, "total_steps": 40000, "loss": 0.0379, "lr": 0.06633171486648808, "epoch": 1.3453936921310434, "percentage": 68.84, "elapsed_time": "1 day, 5:06:04", "remaining_time": "13:10:26", "throughput": 332.83, "total_tokens": 34868672} {"current_steps": 27540, "total_steps": 40000, "loss": 0.0584, "lr": 0.06628283128006499, "epoch": 1.3456379937947378, "percentage": 68.85, "elapsed_time": "1 day, 5:06:07", "remaining_time": "13:10:00", "throughput": 332.88, "total_tokens": 34875040} {"current_steps": 27545, "total_steps": 40000, "loss": 0.0583, "lr": 0.0662339606038813, "epoch": 1.345882295458432, "percentage": 68.86, "elapsed_time": "1 day, 5:06:10", "remaining_time": "13:09:33", "throughput": 332.93, "total_tokens": 34881024} {"current_steps": 27550, "total_steps": 40000, "loss": 0.0401, "lr": 0.06618510284547358, "epoch": 1.3461265971221263, "percentage": 68.88, "elapsed_time": "1 day, 5:06:13", "remaining_time": "13:09:07", "throughput": 332.98, "total_tokens": 34887040} {"current_steps": 27555, "total_steps": 40000, "loss": 0.0644, "lr": 0.06613625801237633, "epoch": 1.3463708987858207, "percentage": 68.89, "elapsed_time": "1 day, 5:06:16", "remaining_time": "13:08:41", "throughput": 333.03, "total_tokens": 34893376} {"current_steps": 27560, "total_steps": 40000, "loss": 0.082, "lr": 0.066087426112122, "epoch": 1.346615200449515, "percentage": 68.9, "elapsed_time": "1 day, 5:06:19", "remaining_time": "13:08:15", "throughput": 333.08, "total_tokens": 34899648} {"current_steps": 27565, "total_steps": 40000, "loss": 0.0491, "lr": 0.06603860715224101, "epoch": 1.3468595021132095, "percentage": 68.91, "elapsed_time": "1 day, 5:06:22", "remaining_time": "13:07:49", "throughput": 333.13, "total_tokens": 34905824} {"current_steps": 27570, "total_steps": 40000, "loss": 0.0378, "lr": 0.06598980114026198, "epoch": 1.3471038037769036, "percentage": 68.92, "elapsed_time": "1 day, 5:06:25", "remaining_time": "13:07:22", "throughput": 333.18, "total_tokens": 34912352} {"current_steps": 27575, "total_steps": 40000, "loss": 0.0518, "lr": 0.06594100808371128, "epoch": 1.347348105440598, "percentage": 68.94, "elapsed_time": "1 day, 5:06:28", "remaining_time": "13:06:56", "throughput": 333.23, "total_tokens": 34918688} {"current_steps": 27580, "total_steps": 40000, "loss": 0.046, "lr": 0.06589222799011357, "epoch": 1.3475924071042924, "percentage": 68.95, "elapsed_time": "1 day, 5:06:31", "remaining_time": "13:06:30", "throughput": 333.28, "total_tokens": 34924832} {"current_steps": 27585, "total_steps": 40000, "loss": 0.0557, "lr": 0.0658434608669912, "epoch": 1.3478367087679868, "percentage": 68.96, "elapsed_time": "1 day, 5:06:34", "remaining_time": "13:06:04", "throughput": 333.33, "total_tokens": 34931392} {"current_steps": 27590, "total_steps": 40000, "loss": 0.0492, "lr": 0.06579470672186473, "epoch": 1.348081010431681, "percentage": 68.97, "elapsed_time": "1 day, 5:06:37", "remaining_time": "13:05:38", "throughput": 333.39, "total_tokens": 34938240} {"current_steps": 27595, "total_steps": 40000, "loss": 0.0824, "lr": 0.06574596556225275, "epoch": 1.3483253120953753, "percentage": 68.99, "elapsed_time": "1 day, 5:06:40", "remaining_time": "13:05:12", "throughput": 333.44, "total_tokens": 34944320} {"current_steps": 27600, "total_steps": 40000, "loss": 0.0548, "lr": 0.06569723739567161, "epoch": 1.3485696137590697, "percentage": 69.0, "elapsed_time": "1 day, 5:06:44", "remaining_time": "13:04:45", "throughput": 333.49, "total_tokens": 34950976} {"current_steps": 27600, "total_steps": 40000, "eval_loss": 0.06252626329660416, "epoch": 1.3485696137590697, "percentage": 69.0, "elapsed_time": "1 day, 5:17:24", "remaining_time": "13:09:33", "throughput": 331.46, "total_tokens": 34950976} {"current_steps": 27605, "total_steps": 40000, "loss": 0.0607, "lr": 0.06564852222963588, "epoch": 1.348813915422764, "percentage": 69.01, "elapsed_time": "1 day, 5:17:28", "remaining_time": "13:09:07", "throughput": 331.51, "total_tokens": 34957472} {"current_steps": 27610, "total_steps": 40000, "loss": 0.0521, "lr": 0.06559982007165813, "epoch": 1.3490582170864585, "percentage": 69.03, "elapsed_time": "1 day, 5:17:31", "remaining_time": "13:08:41", "throughput": 331.56, "total_tokens": 34963488} {"current_steps": 27615, "total_steps": 40000, "loss": 0.0546, "lr": 0.06555113092924868, "epoch": 1.3493025187501526, "percentage": 69.04, "elapsed_time": "1 day, 5:17:34", "remaining_time": "13:08:15", "throughput": 331.61, "total_tokens": 34969344} {"current_steps": 27620, "total_steps": 40000, "loss": 0.0514, "lr": 0.06550245480991615, "epoch": 1.349546820413847, "percentage": 69.05, "elapsed_time": "1 day, 5:17:37", "remaining_time": "13:07:48", "throughput": 331.66, "total_tokens": 34975776} {"current_steps": 27625, "total_steps": 40000, "loss": 0.0586, "lr": 0.0654537917211669, "epoch": 1.3497911220775414, "percentage": 69.06, "elapsed_time": "1 day, 5:17:40", "remaining_time": "13:07:22", "throughput": 331.71, "total_tokens": 34982144} {"current_steps": 27630, "total_steps": 40000, "loss": 0.0438, "lr": 0.0654051416705055, "epoch": 1.3500354237412358, "percentage": 69.08, "elapsed_time": "1 day, 5:17:43", "remaining_time": "13:06:56", "throughput": 331.76, "total_tokens": 34988800} {"current_steps": 27635, "total_steps": 40000, "loss": 0.0912, "lr": 0.06535650466543427, "epoch": 1.35027972540493, "percentage": 69.09, "elapsed_time": "1 day, 5:17:46", "remaining_time": "13:06:30", "throughput": 331.81, "total_tokens": 34994944} {"current_steps": 27640, "total_steps": 40000, "loss": 0.0388, "lr": 0.0653078807134538, "epoch": 1.3505240270686243, "percentage": 69.1, "elapsed_time": "1 day, 5:17:50", "remaining_time": "13:06:03", "throughput": 331.87, "total_tokens": 35001888} {"current_steps": 27645, "total_steps": 40000, "loss": 0.0629, "lr": 0.06525926982206236, "epoch": 1.3507683287323187, "percentage": 69.11, "elapsed_time": "1 day, 5:17:53", "remaining_time": "13:05:37", "throughput": 331.92, "total_tokens": 35008128} {"current_steps": 27650, "total_steps": 40000, "loss": 0.0585, "lr": 0.06521067199875648, "epoch": 1.351012630396013, "percentage": 69.12, "elapsed_time": "1 day, 5:17:56", "remaining_time": "13:05:11", "throughput": 331.96, "total_tokens": 35014368} {"current_steps": 27655, "total_steps": 40000, "loss": 0.043, "lr": 0.06516208725103047, "epoch": 1.3512569320597074, "percentage": 69.14, "elapsed_time": "1 day, 5:17:59", "remaining_time": "13:04:45", "throughput": 332.01, "total_tokens": 35020576} {"current_steps": 27660, "total_steps": 40000, "loss": 0.0407, "lr": 0.06511351558637678, "epoch": 1.3515012337234016, "percentage": 69.15, "elapsed_time": "1 day, 5:18:02", "remaining_time": "13:04:19", "throughput": 332.06, "total_tokens": 35026752} {"current_steps": 27665, "total_steps": 40000, "loss": 0.0945, "lr": 0.06506495701228569, "epoch": 1.351745535387096, "percentage": 69.16, "elapsed_time": "1 day, 5:18:05", "remaining_time": "13:03:52", "throughput": 332.11, "total_tokens": 35032608} {"current_steps": 27670, "total_steps": 40000, "loss": 0.0781, "lr": 0.06501641153624559, "epoch": 1.3519898370507903, "percentage": 69.17, "elapsed_time": "1 day, 5:18:08", "remaining_time": "13:03:26", "throughput": 332.16, "total_tokens": 35039008} {"current_steps": 27675, "total_steps": 40000, "loss": 0.0672, "lr": 0.06496787916574286, "epoch": 1.3522341387144847, "percentage": 69.19, "elapsed_time": "1 day, 5:18:11", "remaining_time": "13:03:00", "throughput": 332.21, "total_tokens": 35045248} {"current_steps": 27680, "total_steps": 40000, "loss": 0.045, "lr": 0.06491935990826168, "epoch": 1.3524784403781789, "percentage": 69.2, "elapsed_time": "1 day, 5:18:14", "remaining_time": "13:02:34", "throughput": 332.26, "total_tokens": 35051488} {"current_steps": 27685, "total_steps": 40000, "loss": 0.0406, "lr": 0.0648708537712844, "epoch": 1.3527227420418733, "percentage": 69.21, "elapsed_time": "1 day, 5:18:17", "remaining_time": "13:02:08", "throughput": 332.31, "total_tokens": 35057856} {"current_steps": 27690, "total_steps": 40000, "loss": 0.0589, "lr": 0.06482236076229132, "epoch": 1.3529670437055676, "percentage": 69.23, "elapsed_time": "1 day, 5:18:20", "remaining_time": "13:01:41", "throughput": 332.36, "total_tokens": 35064256} {"current_steps": 27695, "total_steps": 40000, "loss": 0.0746, "lr": 0.06477388088876056, "epoch": 1.353211345369262, "percentage": 69.24, "elapsed_time": "1 day, 5:18:23", "remaining_time": "13:01:15", "throughput": 332.41, "total_tokens": 35071040} {"current_steps": 27700, "total_steps": 40000, "loss": 0.0779, "lr": 0.06472541415816846, "epoch": 1.3534556470329564, "percentage": 69.25, "elapsed_time": "1 day, 5:18:27", "remaining_time": "13:00:49", "throughput": 332.46, "total_tokens": 35077280} {"current_steps": 27705, "total_steps": 40000, "loss": 0.0367, "lr": 0.06467696057798909, "epoch": 1.3536999486966506, "percentage": 69.26, "elapsed_time": "1 day, 5:18:30", "remaining_time": "13:00:23", "throughput": 332.51, "total_tokens": 35083456} {"current_steps": 27710, "total_steps": 40000, "loss": 0.0502, "lr": 0.0646285201556946, "epoch": 1.353944250360345, "percentage": 69.27, "elapsed_time": "1 day, 5:18:33", "remaining_time": "12:59:57", "throughput": 332.56, "total_tokens": 35089952} {"current_steps": 27715, "total_steps": 40000, "loss": 0.049, "lr": 0.06458009289875521, "epoch": 1.3541885520240393, "percentage": 69.29, "elapsed_time": "1 day, 5:18:36", "remaining_time": "12:59:31", "throughput": 332.62, "total_tokens": 35096960} {"current_steps": 27720, "total_steps": 40000, "loss": 0.0412, "lr": 0.0645316788146389, "epoch": 1.3544328536877337, "percentage": 69.3, "elapsed_time": "1 day, 5:18:39", "remaining_time": "12:59:05", "throughput": 332.67, "total_tokens": 35102944} {"current_steps": 27725, "total_steps": 40000, "loss": 0.0426, "lr": 0.06448327791081175, "epoch": 1.3546771553514279, "percentage": 69.31, "elapsed_time": "1 day, 5:18:42", "remaining_time": "12:58:39", "throughput": 332.72, "total_tokens": 35109216} {"current_steps": 27730, "total_steps": 40000, "loss": 0.1011, "lr": 0.0644348901947379, "epoch": 1.3549214570151222, "percentage": 69.33, "elapsed_time": "1 day, 5:18:45", "remaining_time": "12:58:13", "throughput": 332.76, "total_tokens": 35115136} {"current_steps": 27735, "total_steps": 40000, "loss": 0.043, "lr": 0.06438651567387917, "epoch": 1.3551657586788166, "percentage": 69.34, "elapsed_time": "1 day, 5:18:48", "remaining_time": "12:57:46", "throughput": 332.81, "total_tokens": 35121248} {"current_steps": 27740, "total_steps": 40000, "loss": 0.0525, "lr": 0.0643381543556957, "epoch": 1.355410060342511, "percentage": 69.35, "elapsed_time": "1 day, 5:18:51", "remaining_time": "12:57:20", "throughput": 332.86, "total_tokens": 35127328} {"current_steps": 27745, "total_steps": 40000, "loss": 0.0666, "lr": 0.06428980624764526, "epoch": 1.3556543620062054, "percentage": 69.36, "elapsed_time": "1 day, 5:18:54", "remaining_time": "12:56:54", "throughput": 332.91, "total_tokens": 35133248} {"current_steps": 27750, "total_steps": 40000, "loss": 0.0693, "lr": 0.06424147135718378, "epoch": 1.3558986636698995, "percentage": 69.38, "elapsed_time": "1 day, 5:18:57", "remaining_time": "12:56:28", "throughput": 332.96, "total_tokens": 35140000} {"current_steps": 27755, "total_steps": 40000, "loss": 0.0404, "lr": 0.06419314969176519, "epoch": 1.356142965333594, "percentage": 69.39, "elapsed_time": "1 day, 5:19:00", "remaining_time": "12:56:02", "throughput": 333.01, "total_tokens": 35146272} {"current_steps": 27760, "total_steps": 40000, "loss": 0.0799, "lr": 0.06414484125884118, "epoch": 1.3563872669972883, "percentage": 69.4, "elapsed_time": "1 day, 5:19:03", "remaining_time": "12:55:36", "throughput": 333.06, "total_tokens": 35152352} {"current_steps": 27765, "total_steps": 40000, "loss": 0.0387, "lr": 0.06409654606586157, "epoch": 1.3566315686609824, "percentage": 69.41, "elapsed_time": "1 day, 5:19:07", "remaining_time": "12:55:10", "throughput": 333.11, "total_tokens": 35158784} {"current_steps": 27770, "total_steps": 40000, "loss": 0.0674, "lr": 0.06404826412027415, "epoch": 1.3568758703246768, "percentage": 69.42, "elapsed_time": "1 day, 5:19:10", "remaining_time": "12:54:44", "throughput": 333.16, "total_tokens": 35165312} {"current_steps": 27775, "total_steps": 40000, "loss": 0.0569, "lr": 0.06399999542952453, "epoch": 1.3571201719883712, "percentage": 69.44, "elapsed_time": "1 day, 5:19:13", "remaining_time": "12:54:18", "throughput": 333.21, "total_tokens": 35171680} {"current_steps": 27780, "total_steps": 40000, "loss": 0.0578, "lr": 0.0639517400010563, "epoch": 1.3573644736520656, "percentage": 69.45, "elapsed_time": "1 day, 5:19:16", "remaining_time": "12:53:52", "throughput": 333.26, "total_tokens": 35178048} {"current_steps": 27785, "total_steps": 40000, "loss": 0.037, "lr": 0.06390349784231118, "epoch": 1.35760877531576, "percentage": 69.46, "elapsed_time": "1 day, 5:19:19", "remaining_time": "12:53:26", "throughput": 333.32, "total_tokens": 35184896} {"current_steps": 27790, "total_steps": 40000, "loss": 0.0502, "lr": 0.06385526896072859, "epoch": 1.3578530769794543, "percentage": 69.47, "elapsed_time": "1 day, 5:19:22", "remaining_time": "12:53:00", "throughput": 333.37, "total_tokens": 35191552} {"current_steps": 27795, "total_steps": 40000, "loss": 0.0469, "lr": 0.06380705336374613, "epoch": 1.3580973786431485, "percentage": 69.49, "elapsed_time": "1 day, 5:19:25", "remaining_time": "12:52:34", "throughput": 333.42, "total_tokens": 35197888} {"current_steps": 27800, "total_steps": 40000, "loss": 0.059, "lr": 0.06375885105879918, "epoch": 1.3583416803068429, "percentage": 69.5, "elapsed_time": "1 day, 5:19:28", "remaining_time": "12:52:08", "throughput": 333.47, "total_tokens": 35204128} {"current_steps": 27800, "total_steps": 40000, "eval_loss": 0.06430228799581528, "epoch": 1.3583416803068429, "percentage": 69.5, "elapsed_time": "1 day, 5:30:08", "remaining_time": "12:56:49", "throughput": 331.46, "total_tokens": 35204128} {"current_steps": 27805, "total_steps": 40000, "loss": 0.0426, "lr": 0.06371066205332115, "epoch": 1.3585859819705373, "percentage": 69.51, "elapsed_time": "1 day, 5:30:12", "remaining_time": "12:56:23", "throughput": 331.51, "total_tokens": 35210464} {"current_steps": 27810, "total_steps": 40000, "loss": 0.0559, "lr": 0.06366248635474347, "epoch": 1.3588302836342314, "percentage": 69.53, "elapsed_time": "1 day, 5:30:15", "remaining_time": "12:55:57", "throughput": 331.56, "total_tokens": 35216544} {"current_steps": 27815, "total_steps": 40000, "loss": 0.0729, "lr": 0.06361432397049532, "epoch": 1.3590745852979258, "percentage": 69.54, "elapsed_time": "1 day, 5:30:18", "remaining_time": "12:55:31", "throughput": 331.61, "total_tokens": 35222976} {"current_steps": 27820, "total_steps": 40000, "loss": 0.0544, "lr": 0.06356617490800408, "epoch": 1.3593188869616202, "percentage": 69.55, "elapsed_time": "1 day, 5:30:21", "remaining_time": "12:55:05", "throughput": 331.66, "total_tokens": 35229824} {"current_steps": 27825, "total_steps": 40000, "loss": 0.034, "lr": 0.06351803917469478, "epoch": 1.3595631886253146, "percentage": 69.56, "elapsed_time": "1 day, 5:30:24", "remaining_time": "12:54:39", "throughput": 331.72, "total_tokens": 35236416} {"current_steps": 27830, "total_steps": 40000, "loss": 0.0226, "lr": 0.06346991677799067, "epoch": 1.359807490289009, "percentage": 69.58, "elapsed_time": "1 day, 5:30:27", "remaining_time": "12:54:13", "throughput": 331.77, "total_tokens": 35242656} {"current_steps": 27835, "total_steps": 40000, "loss": 0.0496, "lr": 0.06342180772531283, "epoch": 1.3600517919527033, "percentage": 69.59, "elapsed_time": "1 day, 5:30:30", "remaining_time": "12:53:47", "throughput": 331.82, "total_tokens": 35249440} {"current_steps": 27840, "total_steps": 40000, "loss": 0.0419, "lr": 0.06337371202408021, "epoch": 1.3602960936163975, "percentage": 69.6, "elapsed_time": "1 day, 5:30:33", "remaining_time": "12:53:21", "throughput": 331.87, "total_tokens": 35255552} {"current_steps": 27845, "total_steps": 40000, "loss": 0.0369, "lr": 0.06332562968170984, "epoch": 1.3605403952800919, "percentage": 69.61, "elapsed_time": "1 day, 5:30:37", "remaining_time": "12:52:54", "throughput": 331.91, "total_tokens": 35261632} {"current_steps": 27850, "total_steps": 40000, "loss": 0.0623, "lr": 0.06327756070561656, "epoch": 1.3607846969437862, "percentage": 69.62, "elapsed_time": "1 day, 5:30:40", "remaining_time": "12:52:28", "throughput": 331.97, "total_tokens": 35268416} {"current_steps": 27855, "total_steps": 40000, "loss": 0.0597, "lr": 0.06322950510321329, "epoch": 1.3610289986074804, "percentage": 69.64, "elapsed_time": "1 day, 5:30:43", "remaining_time": "12:52:02", "throughput": 332.02, "total_tokens": 35274624} {"current_steps": 27860, "total_steps": 40000, "loss": 0.0649, "lr": 0.06318146288191076, "epoch": 1.3612733002711748, "percentage": 69.65, "elapsed_time": "1 day, 5:30:46", "remaining_time": "12:51:36", "throughput": 332.07, "total_tokens": 35281536} {"current_steps": 27865, "total_steps": 40000, "loss": 0.0627, "lr": 0.06313343404911763, "epoch": 1.3615176019348691, "percentage": 69.66, "elapsed_time": "1 day, 5:30:49", "remaining_time": "12:51:10", "throughput": 332.12, "total_tokens": 35287616} {"current_steps": 27870, "total_steps": 40000, "loss": 0.0544, "lr": 0.0630854186122406, "epoch": 1.3617619035985635, "percentage": 69.67, "elapsed_time": "1 day, 5:30:52", "remaining_time": "12:50:44", "throughput": 332.17, "total_tokens": 35293920} {"current_steps": 27875, "total_steps": 40000, "loss": 0.0527, "lr": 0.06303741657868431, "epoch": 1.362006205262258, "percentage": 69.69, "elapsed_time": "1 day, 5:30:55", "remaining_time": "12:50:18", "throughput": 332.22, "total_tokens": 35300128} {"current_steps": 27880, "total_steps": 40000, "loss": 0.0639, "lr": 0.06298942795585115, "epoch": 1.3622505069259523, "percentage": 69.7, "elapsed_time": "1 day, 5:30:58", "remaining_time": "12:49:52", "throughput": 332.27, "total_tokens": 35306208} {"current_steps": 27885, "total_steps": 40000, "loss": 0.095, "lr": 0.06294145275114167, "epoch": 1.3624948085896464, "percentage": 69.71, "elapsed_time": "1 day, 5:31:01", "remaining_time": "12:49:26", "throughput": 332.31, "total_tokens": 35312288} {"current_steps": 27890, "total_steps": 40000, "loss": 0.0695, "lr": 0.06289349097195428, "epoch": 1.3627391102533408, "percentage": 69.73, "elapsed_time": "1 day, 5:31:04", "remaining_time": "12:49:00", "throughput": 332.36, "total_tokens": 35318272} {"current_steps": 27895, "total_steps": 40000, "loss": 0.064, "lr": 0.06284554262568516, "epoch": 1.3629834119170352, "percentage": 69.74, "elapsed_time": "1 day, 5:31:07", "remaining_time": "12:48:34", "throughput": 332.41, "total_tokens": 35324352} {"current_steps": 27900, "total_steps": 40000, "loss": 0.0526, "lr": 0.06279760771972868, "epoch": 1.3632277135807294, "percentage": 69.75, "elapsed_time": "1 day, 5:31:10", "remaining_time": "12:48:08", "throughput": 332.46, "total_tokens": 35330400} {"current_steps": 27905, "total_steps": 40000, "loss": 0.0603, "lr": 0.06274968626147688, "epoch": 1.3634720152444237, "percentage": 69.76, "elapsed_time": "1 day, 5:31:13", "remaining_time": "12:47:42", "throughput": 332.5, "total_tokens": 35336480} {"current_steps": 27910, "total_steps": 40000, "loss": 0.0317, "lr": 0.06270177825831993, "epoch": 1.3637163169081181, "percentage": 69.77, "elapsed_time": "1 day, 5:31:16", "remaining_time": "12:47:16", "throughput": 332.56, "total_tokens": 35343168} {"current_steps": 27915, "total_steps": 40000, "loss": 0.0706, "lr": 0.06265388371764587, "epoch": 1.3639606185718125, "percentage": 69.79, "elapsed_time": "1 day, 5:31:19", "remaining_time": "12:46:50", "throughput": 332.61, "total_tokens": 35349408} {"current_steps": 27920, "total_steps": 40000, "loss": 0.049, "lr": 0.0626060026468406, "epoch": 1.3642049202355069, "percentage": 69.8, "elapsed_time": "1 day, 5:31:22", "remaining_time": "12:46:24", "throughput": 332.65, "total_tokens": 35355392} {"current_steps": 27925, "total_steps": 40000, "loss": 0.055, "lr": 0.06255813505328794, "epoch": 1.3644492218992013, "percentage": 69.81, "elapsed_time": "1 day, 5:31:25", "remaining_time": "12:45:58", "throughput": 332.7, "total_tokens": 35361664} {"current_steps": 27930, "total_steps": 40000, "loss": 0.0512, "lr": 0.06251028094436978, "epoch": 1.3646935235628954, "percentage": 69.83, "elapsed_time": "1 day, 5:31:28", "remaining_time": "12:45:32", "throughput": 332.75, "total_tokens": 35367968} {"current_steps": 27935, "total_steps": 40000, "loss": 0.0644, "lr": 0.06246244032746568, "epoch": 1.3649378252265898, "percentage": 69.84, "elapsed_time": "1 day, 5:31:31", "remaining_time": "12:45:06", "throughput": 332.8, "total_tokens": 35373888} {"current_steps": 27940, "total_steps": 40000, "loss": 0.0574, "lr": 0.06241461320995342, "epoch": 1.3651821268902842, "percentage": 69.85, "elapsed_time": "1 day, 5:31:35", "remaining_time": "12:44:41", "throughput": 332.85, "total_tokens": 35380320} {"current_steps": 27945, "total_steps": 40000, "loss": 0.0414, "lr": 0.062366799599208426, "epoch": 1.3654264285539783, "percentage": 69.86, "elapsed_time": "1 day, 5:31:38", "remaining_time": "12:44:15", "throughput": 332.9, "total_tokens": 35386688} {"current_steps": 27950, "total_steps": 40000, "loss": 0.0515, "lr": 0.06231899950260418, "epoch": 1.3656707302176727, "percentage": 69.88, "elapsed_time": "1 day, 5:31:41", "remaining_time": "12:43:49", "throughput": 332.95, "total_tokens": 35392608} {"current_steps": 27955, "total_steps": 40000, "loss": 0.0347, "lr": 0.06227121292751214, "epoch": 1.365915031881367, "percentage": 69.89, "elapsed_time": "1 day, 5:31:44", "remaining_time": "12:43:23", "throughput": 332.99, "total_tokens": 35398688} {"current_steps": 27960, "total_steps": 40000, "loss": 0.0655, "lr": 0.062223439881301496, "epoch": 1.3661593335450615, "percentage": 69.9, "elapsed_time": "1 day, 5:31:47", "remaining_time": "12:42:57", "throughput": 333.04, "total_tokens": 35404768} {"current_steps": 27965, "total_steps": 40000, "loss": 0.0529, "lr": 0.06217568037133948, "epoch": 1.3664036352087559, "percentage": 69.91, "elapsed_time": "1 day, 5:31:50", "remaining_time": "12:42:31", "throughput": 333.09, "total_tokens": 35411296} {"current_steps": 27970, "total_steps": 40000, "loss": 0.0687, "lr": 0.06212793440499126, "epoch": 1.3666479368724502, "percentage": 69.92, "elapsed_time": "1 day, 5:31:53", "remaining_time": "12:42:05", "throughput": 333.14, "total_tokens": 35417440} {"current_steps": 27975, "total_steps": 40000, "loss": 0.0753, "lr": 0.062080201989619783, "epoch": 1.3668922385361444, "percentage": 69.94, "elapsed_time": "1 day, 5:31:56", "remaining_time": "12:41:40", "throughput": 333.19, "total_tokens": 35423968} {"current_steps": 27980, "total_steps": 40000, "loss": 0.0964, "lr": 0.062032483132586094, "epoch": 1.3671365401998388, "percentage": 69.95, "elapsed_time": "1 day, 5:31:59", "remaining_time": "12:41:14", "throughput": 333.24, "total_tokens": 35430144} {"current_steps": 27985, "total_steps": 40000, "loss": 0.0674, "lr": 0.0619847778412489, "epoch": 1.3673808418635331, "percentage": 69.96, "elapsed_time": "1 day, 5:32:02", "remaining_time": "12:40:48", "throughput": 333.29, "total_tokens": 35436192} {"current_steps": 27990, "total_steps": 40000, "loss": 0.0594, "lr": 0.06193708612296509, "epoch": 1.3676251435272273, "percentage": 69.97, "elapsed_time": "1 day, 5:32:05", "remaining_time": "12:40:22", "throughput": 333.34, "total_tokens": 35442368} {"current_steps": 27995, "total_steps": 40000, "loss": 0.0547, "lr": 0.06188940798508923, "epoch": 1.3678694451909217, "percentage": 69.99, "elapsed_time": "1 day, 5:32:08", "remaining_time": "12:39:56", "throughput": 333.38, "total_tokens": 35448288} {"current_steps": 28000, "total_steps": 40000, "loss": 0.0463, "lr": 0.06184174343497397, "epoch": 1.368113746854616, "percentage": 70.0, "elapsed_time": "1 day, 5:32:12", "remaining_time": "12:39:30", "throughput": 333.44, "total_tokens": 35455296} {"current_steps": 28000, "total_steps": 40000, "eval_loss": 0.06326847523450851, "epoch": 1.368113746854616, "percentage": 70.0, "elapsed_time": "1 day, 5:42:52", "remaining_time": "12:44:05", "throughput": 331.44, "total_tokens": 35455296} {"current_steps": 28005, "total_steps": 40000, "loss": 0.0365, "lr": 0.061794092479969726, "epoch": 1.3683580485183104, "percentage": 70.01, "elapsed_time": "1 day, 5:42:56", "remaining_time": "12:43:39", "throughput": 331.49, "total_tokens": 35461696} {"current_steps": 28010, "total_steps": 40000, "loss": 0.0315, "lr": 0.06174645512742485, "epoch": 1.3686023501820048, "percentage": 70.03, "elapsed_time": "1 day, 5:42:59", "remaining_time": "12:43:13", "throughput": 331.54, "total_tokens": 35467552} {"current_steps": 28015, "total_steps": 40000, "loss": 0.0671, "lr": 0.06169883138468565, "epoch": 1.3688466518456992, "percentage": 70.04, "elapsed_time": "1 day, 5:43:02", "remaining_time": "12:42:47", "throughput": 331.59, "total_tokens": 35474240} {"current_steps": 28020, "total_steps": 40000, "loss": 0.0605, "lr": 0.06165122125909637, "epoch": 1.3690909535093934, "percentage": 70.05, "elapsed_time": "1 day, 5:43:05", "remaining_time": "12:42:22", "throughput": 331.64, "total_tokens": 35480704} {"current_steps": 28025, "total_steps": 40000, "loss": 0.0595, "lr": 0.061603624757998965, "epoch": 1.3693352551730877, "percentage": 70.06, "elapsed_time": "1 day, 5:43:08", "remaining_time": "12:41:56", "throughput": 331.69, "total_tokens": 35486848} {"current_steps": 28030, "total_steps": 40000, "loss": 0.0554, "lr": 0.0615560418887335, "epoch": 1.3695795568367821, "percentage": 70.08, "elapsed_time": "1 day, 5:43:12", "remaining_time": "12:41:30", "throughput": 331.74, "total_tokens": 35493216} {"current_steps": 28035, "total_steps": 40000, "loss": 0.0585, "lr": 0.06150847265863787, "epoch": 1.3698238585004763, "percentage": 70.09, "elapsed_time": "1 day, 5:43:15", "remaining_time": "12:41:04", "throughput": 331.79, "total_tokens": 35499744} {"current_steps": 28040, "total_steps": 40000, "loss": 0.0441, "lr": 0.061460917075047757, "epoch": 1.3700681601641707, "percentage": 70.1, "elapsed_time": "1 day, 5:43:18", "remaining_time": "12:40:38", "throughput": 331.83, "total_tokens": 35505664} {"current_steps": 28045, "total_steps": 40000, "loss": 0.0347, "lr": 0.06141337514529694, "epoch": 1.370312461827865, "percentage": 70.11, "elapsed_time": "1 day, 5:43:21", "remaining_time": "12:40:12", "throughput": 331.89, "total_tokens": 35512192} {"current_steps": 28050, "total_steps": 40000, "loss": 0.0841, "lr": 0.06136584687671687, "epoch": 1.3705567634915594, "percentage": 70.12, "elapsed_time": "1 day, 5:43:24", "remaining_time": "12:39:46", "throughput": 331.93, "total_tokens": 35518304} {"current_steps": 28055, "total_steps": 40000, "loss": 0.0484, "lr": 0.061318332276637064, "epoch": 1.3708010651552538, "percentage": 70.14, "elapsed_time": "1 day, 5:43:27", "remaining_time": "12:39:20", "throughput": 331.98, "total_tokens": 35524480} {"current_steps": 28060, "total_steps": 40000, "loss": 0.0496, "lr": 0.06127083135238491, "epoch": 1.3710453668189482, "percentage": 70.15, "elapsed_time": "1 day, 5:43:30", "remaining_time": "12:38:54", "throughput": 332.03, "total_tokens": 35530496} {"current_steps": 28065, "total_steps": 40000, "loss": 0.0725, "lr": 0.06122334411128555, "epoch": 1.3712896684826423, "percentage": 70.16, "elapsed_time": "1 day, 5:43:33", "remaining_time": "12:38:28", "throughput": 332.08, "total_tokens": 35536768} {"current_steps": 28070, "total_steps": 40000, "loss": 0.0655, "lr": 0.06117587056066223, "epoch": 1.3715339701463367, "percentage": 70.17, "elapsed_time": "1 day, 5:43:36", "remaining_time": "12:38:03", "throughput": 332.13, "total_tokens": 35543648} {"current_steps": 28075, "total_steps": 40000, "loss": 0.0498, "lr": 0.06112841070783589, "epoch": 1.371778271810031, "percentage": 70.19, "elapsed_time": "1 day, 5:43:39", "remaining_time": "12:37:37", "throughput": 332.18, "total_tokens": 35549856} {"current_steps": 28080, "total_steps": 40000, "loss": 0.0723, "lr": 0.061080964560125406, "epoch": 1.3720225734737252, "percentage": 70.2, "elapsed_time": "1 day, 5:43:42", "remaining_time": "12:37:11", "throughput": 332.23, "total_tokens": 35556064} {"current_steps": 28085, "total_steps": 40000, "loss": 0.0403, "lr": 0.06103353212484766, "epoch": 1.3722668751374196, "percentage": 70.21, "elapsed_time": "1 day, 5:43:45", "remaining_time": "12:36:45", "throughput": 332.28, "total_tokens": 35562368} {"current_steps": 28090, "total_steps": 40000, "loss": 0.0668, "lr": 0.06098611340931722, "epoch": 1.372511176801114, "percentage": 70.23, "elapsed_time": "1 day, 5:43:48", "remaining_time": "12:36:19", "throughput": 332.33, "total_tokens": 35568640} {"current_steps": 28095, "total_steps": 40000, "loss": 0.0787, "lr": 0.06093870842084672, "epoch": 1.3727554784648084, "percentage": 70.24, "elapsed_time": "1 day, 5:43:51", "remaining_time": "12:35:53", "throughput": 332.37, "total_tokens": 35574720} {"current_steps": 28100, "total_steps": 40000, "loss": 0.0513, "lr": 0.06089131716674666, "epoch": 1.3729997801285028, "percentage": 70.25, "elapsed_time": "1 day, 5:43:55", "remaining_time": "12:35:28", "throughput": 332.43, "total_tokens": 35581216} {"current_steps": 28105, "total_steps": 40000, "loss": 0.0584, "lr": 0.060843939654325226, "epoch": 1.373244081792197, "percentage": 70.26, "elapsed_time": "1 day, 5:43:58", "remaining_time": "12:35:02", "throughput": 332.48, "total_tokens": 35587584} {"current_steps": 28110, "total_steps": 40000, "loss": 0.0545, "lr": 0.06079657589088873, "epoch": 1.3734883834558913, "percentage": 70.28, "elapsed_time": "1 day, 5:44:01", "remaining_time": "12:34:36", "throughput": 332.53, "total_tokens": 35594016} {"current_steps": 28115, "total_steps": 40000, "loss": 0.0668, "lr": 0.06074922588374126, "epoch": 1.3737326851195857, "percentage": 70.29, "elapsed_time": "1 day, 5:44:04", "remaining_time": "12:34:10", "throughput": 332.57, "total_tokens": 35600288} {"current_steps": 28120, "total_steps": 40000, "loss": 0.0533, "lr": 0.06070188964018472, "epoch": 1.37397698678328, "percentage": 70.3, "elapsed_time": "1 day, 5:44:07", "remaining_time": "12:33:44", "throughput": 332.62, "total_tokens": 35606272} {"current_steps": 28125, "total_steps": 40000, "loss": 0.0382, "lr": 0.06065456716751902, "epoch": 1.3742212884469742, "percentage": 70.31, "elapsed_time": "1 day, 5:44:10", "remaining_time": "12:33:19", "throughput": 332.68, "total_tokens": 35613088} {"current_steps": 28130, "total_steps": 40000, "loss": 0.0691, "lr": 0.06060725847304182, "epoch": 1.3744655901106686, "percentage": 70.33, "elapsed_time": "1 day, 5:44:13", "remaining_time": "12:32:53", "throughput": 332.72, "total_tokens": 35619040} {"current_steps": 28135, "total_steps": 40000, "loss": 0.0475, "lr": 0.06055996356404877, "epoch": 1.374709891774363, "percentage": 70.34, "elapsed_time": "1 day, 5:44:16", "remaining_time": "12:32:27", "throughput": 332.77, "total_tokens": 35625472} {"current_steps": 28140, "total_steps": 40000, "loss": 0.0792, "lr": 0.06051268244783327, "epoch": 1.3749541934380574, "percentage": 70.35, "elapsed_time": "1 day, 5:44:19", "remaining_time": "12:32:01", "throughput": 332.82, "total_tokens": 35631872} {"current_steps": 28145, "total_steps": 40000, "loss": 0.0374, "lr": 0.06046541513168676, "epoch": 1.3751984951017517, "percentage": 70.36, "elapsed_time": "1 day, 5:44:22", "remaining_time": "12:31:36", "throughput": 332.87, "total_tokens": 35638272} {"current_steps": 28150, "total_steps": 40000, "loss": 0.0741, "lr": 0.060418161622898356, "epoch": 1.375442796765446, "percentage": 70.38, "elapsed_time": "1 day, 5:44:25", "remaining_time": "12:31:10", "throughput": 332.92, "total_tokens": 35644384} {"current_steps": 28155, "total_steps": 40000, "loss": 0.0395, "lr": 0.06037092192875521, "epoch": 1.3756870984291403, "percentage": 70.39, "elapsed_time": "1 day, 5:44:29", "remaining_time": "12:30:44", "throughput": 332.98, "total_tokens": 35651392} {"current_steps": 28160, "total_steps": 40000, "loss": 0.078, "lr": 0.060323696056542225, "epoch": 1.3759314000928347, "percentage": 70.4, "elapsed_time": "1 day, 5:44:32", "remaining_time": "12:30:19", "throughput": 333.03, "total_tokens": 35657920} {"current_steps": 28165, "total_steps": 40000, "loss": 0.0428, "lr": 0.06027648401354229, "epoch": 1.376175701756529, "percentage": 70.41, "elapsed_time": "1 day, 5:44:35", "remaining_time": "12:29:53", "throughput": 333.07, "total_tokens": 35663776} {"current_steps": 28170, "total_steps": 40000, "loss": 0.051, "lr": 0.06022928580703601, "epoch": 1.3764200034202232, "percentage": 70.43, "elapsed_time": "1 day, 5:44:38", "remaining_time": "12:29:27", "throughput": 333.13, "total_tokens": 35671040} {"current_steps": 28175, "total_steps": 40000, "loss": 0.0586, "lr": 0.060182101444301986, "epoch": 1.3766643050839176, "percentage": 70.44, "elapsed_time": "1 day, 5:44:41", "remaining_time": "12:29:01", "throughput": 333.18, "total_tokens": 35677056} {"current_steps": 28180, "total_steps": 40000, "loss": 0.0509, "lr": 0.06013493093261669, "epoch": 1.376908606747612, "percentage": 70.45, "elapsed_time": "1 day, 5:44:44", "remaining_time": "12:28:36", "throughput": 333.23, "total_tokens": 35683584} {"current_steps": 28185, "total_steps": 40000, "loss": 0.0595, "lr": 0.06008777427925432, "epoch": 1.3771529084113063, "percentage": 70.46, "elapsed_time": "1 day, 5:44:47", "remaining_time": "12:28:10", "throughput": 333.27, "total_tokens": 35689600} {"current_steps": 28190, "total_steps": 40000, "loss": 0.0777, "lr": 0.06004063149148705, "epoch": 1.3773972100750007, "percentage": 70.47, "elapsed_time": "1 day, 5:44:50", "remaining_time": "12:27:44", "throughput": 333.32, "total_tokens": 35695648} {"current_steps": 28195, "total_steps": 40000, "loss": 0.0475, "lr": 0.05999350257658497, "epoch": 1.3776415117386949, "percentage": 70.49, "elapsed_time": "1 day, 5:44:53", "remaining_time": "12:27:19", "throughput": 333.37, "total_tokens": 35701984} {"current_steps": 28200, "total_steps": 40000, "loss": 0.1003, "lr": 0.05994638754181582, "epoch": 1.3778858134023892, "percentage": 70.5, "elapsed_time": "1 day, 5:44:56", "remaining_time": "12:26:53", "throughput": 333.42, "total_tokens": 35708160} {"current_steps": 28200, "total_steps": 40000, "eval_loss": 0.0620783232152462, "epoch": 1.3778858134023892, "percentage": 70.5, "elapsed_time": "1 day, 5:55:37", "remaining_time": "12:31:21", "throughput": 331.44, "total_tokens": 35708160} {"current_steps": 28205, "total_steps": 40000, "loss": 0.0667, "lr": 0.059899286394445445, "epoch": 1.3781301150660836, "percentage": 70.51, "elapsed_time": "1 day, 5:55:41", "remaining_time": "12:30:56", "throughput": 331.48, "total_tokens": 35714560} {"current_steps": 28210, "total_steps": 40000, "loss": 0.0416, "lr": 0.059852199141737346, "epoch": 1.378374416729778, "percentage": 70.53, "elapsed_time": "1 day, 5:55:44", "remaining_time": "12:30:30", "throughput": 331.53, "total_tokens": 35720672} {"current_steps": 28215, "total_steps": 40000, "loss": 0.0557, "lr": 0.05980512579095304, "epoch": 1.3786187183934722, "percentage": 70.54, "elapsed_time": "1 day, 5:55:47", "remaining_time": "12:30:04", "throughput": 331.58, "total_tokens": 35726656} {"current_steps": 28220, "total_steps": 40000, "loss": 0.0549, "lr": 0.05975806634935181, "epoch": 1.3788630200571665, "percentage": 70.55, "elapsed_time": "1 day, 5:55:50", "remaining_time": "12:29:38", "throughput": 331.63, "total_tokens": 35733088} {"current_steps": 28225, "total_steps": 40000, "loss": 0.05, "lr": 0.05971102082419076, "epoch": 1.379107321720861, "percentage": 70.56, "elapsed_time": "1 day, 5:55:53", "remaining_time": "12:29:12", "throughput": 331.67, "total_tokens": 35739040} {"current_steps": 28230, "total_steps": 40000, "loss": 0.0421, "lr": 0.05966398922272492, "epoch": 1.3793516233845553, "percentage": 70.58, "elapsed_time": "1 day, 5:55:56", "remaining_time": "12:28:47", "throughput": 331.73, "total_tokens": 35745600} {"current_steps": 28235, "total_steps": 40000, "loss": 0.0399, "lr": 0.059616971552207236, "epoch": 1.3795959250482497, "percentage": 70.59, "elapsed_time": "1 day, 5:55:59", "remaining_time": "12:28:21", "throughput": 331.78, "total_tokens": 35752128} {"current_steps": 28240, "total_steps": 40000, "loss": 0.0369, "lr": 0.059569967819888305, "epoch": 1.3798402267119438, "percentage": 70.6, "elapsed_time": "1 day, 5:56:02", "remaining_time": "12:27:55", "throughput": 331.82, "total_tokens": 35758368} {"current_steps": 28245, "total_steps": 40000, "loss": 0.0364, "lr": 0.05952297803301681, "epoch": 1.3800845283756382, "percentage": 70.61, "elapsed_time": "1 day, 5:56:05", "remaining_time": "12:27:30", "throughput": 331.87, "total_tokens": 35764736} {"current_steps": 28250, "total_steps": 40000, "loss": 0.0322, "lr": 0.059476002198839056, "epoch": 1.3803288300393326, "percentage": 70.62, "elapsed_time": "1 day, 5:56:09", "remaining_time": "12:27:04", "throughput": 331.92, "total_tokens": 35771008} {"current_steps": 28255, "total_steps": 40000, "loss": 0.0936, "lr": 0.05942904032459935, "epoch": 1.380573131703027, "percentage": 70.64, "elapsed_time": "1 day, 5:56:12", "remaining_time": "12:26:38", "throughput": 331.97, "total_tokens": 35777216} {"current_steps": 28260, "total_steps": 40000, "loss": 0.0516, "lr": 0.05938209241753987, "epoch": 1.3808174333667211, "percentage": 70.65, "elapsed_time": "1 day, 5:56:15", "remaining_time": "12:26:12", "throughput": 332.02, "total_tokens": 35783520} {"current_steps": 28265, "total_steps": 40000, "loss": 0.0593, "lr": 0.05933515848490046, "epoch": 1.3810617350304155, "percentage": 70.66, "elapsed_time": "1 day, 5:56:18", "remaining_time": "12:25:47", "throughput": 332.07, "total_tokens": 35790112} {"current_steps": 28270, "total_steps": 40000, "loss": 0.0735, "lr": 0.059288238533918985, "epoch": 1.38130603669411, "percentage": 70.67, "elapsed_time": "1 day, 5:56:21", "remaining_time": "12:25:21", "throughput": 332.12, "total_tokens": 35796320} {"current_steps": 28275, "total_steps": 40000, "loss": 0.0769, "lr": 0.05924133257183113, "epoch": 1.3815503383578043, "percentage": 70.69, "elapsed_time": "1 day, 5:56:24", "remaining_time": "12:24:55", "throughput": 332.17, "total_tokens": 35802560} {"current_steps": 28280, "total_steps": 40000, "loss": 0.0363, "lr": 0.059194440605870285, "epoch": 1.3817946400214987, "percentage": 70.7, "elapsed_time": "1 day, 5:56:27", "remaining_time": "12:24:30", "throughput": 332.22, "total_tokens": 35809280} {"current_steps": 28285, "total_steps": 40000, "loss": 0.0423, "lr": 0.059147562643267884, "epoch": 1.3820389416851928, "percentage": 70.71, "elapsed_time": "1 day, 5:56:30", "remaining_time": "12:24:04", "throughput": 332.27, "total_tokens": 35815680} {"current_steps": 28290, "total_steps": 40000, "loss": 0.044, "lr": 0.059100698691253055, "epoch": 1.3822832433488872, "percentage": 70.73, "elapsed_time": "1 day, 5:56:33", "remaining_time": "12:23:38", "throughput": 332.32, "total_tokens": 35821888} {"current_steps": 28295, "total_steps": 40000, "loss": 0.0383, "lr": 0.05905384875705273, "epoch": 1.3825275450125816, "percentage": 70.74, "elapsed_time": "1 day, 5:56:36", "remaining_time": "12:23:13", "throughput": 332.37, "total_tokens": 35828512} {"current_steps": 28300, "total_steps": 40000, "loss": 0.0438, "lr": 0.05900701284789189, "epoch": 1.3827718466762757, "percentage": 70.75, "elapsed_time": "1 day, 5:56:40", "remaining_time": "12:22:47", "throughput": 332.42, "total_tokens": 35834592} {"current_steps": 28305, "total_steps": 40000, "loss": 0.0524, "lr": 0.058960190970993115, "epoch": 1.38301614833997, "percentage": 70.76, "elapsed_time": "1 day, 5:56:43", "remaining_time": "12:22:21", "throughput": 332.47, "total_tokens": 35841248} {"current_steps": 28310, "total_steps": 40000, "loss": 0.0389, "lr": 0.058913383133576955, "epoch": 1.3832604500036645, "percentage": 70.78, "elapsed_time": "1 day, 5:56:46", "remaining_time": "12:21:56", "throughput": 332.52, "total_tokens": 35847456} {"current_steps": 28315, "total_steps": 40000, "loss": 0.0847, "lr": 0.05886658934286185, "epoch": 1.3835047516673589, "percentage": 70.79, "elapsed_time": "1 day, 5:56:49", "remaining_time": "12:21:30", "throughput": 332.57, "total_tokens": 35853792} {"current_steps": 28320, "total_steps": 40000, "loss": 0.0669, "lr": 0.058819809606063846, "epoch": 1.3837490533310532, "percentage": 70.8, "elapsed_time": "1 day, 5:56:52", "remaining_time": "12:21:05", "throughput": 332.62, "total_tokens": 35860768} {"current_steps": 28325, "total_steps": 40000, "loss": 0.0275, "lr": 0.05877304393039711, "epoch": 1.3839933549947476, "percentage": 70.81, "elapsed_time": "1 day, 5:56:55", "remaining_time": "12:20:39", "throughput": 332.67, "total_tokens": 35867616} {"current_steps": 28330, "total_steps": 40000, "loss": 0.0479, "lr": 0.05872629232307338, "epoch": 1.3842376566584418, "percentage": 70.83, "elapsed_time": "1 day, 5:56:58", "remaining_time": "12:20:13", "throughput": 332.72, "total_tokens": 35873888} {"current_steps": 28335, "total_steps": 40000, "loss": 0.0742, "lr": 0.05867955479130239, "epoch": 1.3844819583221362, "percentage": 70.84, "elapsed_time": "1 day, 5:57:01", "remaining_time": "12:19:48", "throughput": 332.77, "total_tokens": 35879712} {"current_steps": 28340, "total_steps": 40000, "loss": 0.0416, "lr": 0.058632831342291705, "epoch": 1.3847262599858305, "percentage": 70.85, "elapsed_time": "1 day, 5:57:04", "remaining_time": "12:19:22", "throughput": 332.82, "total_tokens": 35886016} {"current_steps": 28345, "total_steps": 40000, "loss": 0.0514, "lr": 0.05858612198324655, "epoch": 1.3849705616495247, "percentage": 70.86, "elapsed_time": "1 day, 5:57:08", "remaining_time": "12:18:57", "throughput": 332.87, "total_tokens": 35892928} {"current_steps": 28350, "total_steps": 40000, "loss": 0.0567, "lr": 0.05853942672137025, "epoch": 1.385214863313219, "percentage": 70.88, "elapsed_time": "1 day, 5:57:11", "remaining_time": "12:18:31", "throughput": 332.92, "total_tokens": 35899232} {"current_steps": 28355, "total_steps": 40000, "loss": 0.0791, "lr": 0.05849274556386363, "epoch": 1.3854591649769135, "percentage": 70.89, "elapsed_time": "1 day, 5:57:14", "remaining_time": "12:18:05", "throughput": 332.96, "total_tokens": 35904896} {"current_steps": 28360, "total_steps": 40000, "loss": 0.0725, "lr": 0.05844607851792567, "epoch": 1.3857034666406078, "percentage": 70.9, "elapsed_time": "1 day, 5:57:17", "remaining_time": "12:17:40", "throughput": 333.02, "total_tokens": 35911488} {"current_steps": 28365, "total_steps": 40000, "loss": 0.0567, "lr": 0.058399425590752924, "epoch": 1.3859477683043022, "percentage": 70.91, "elapsed_time": "1 day, 5:57:20", "remaining_time": "12:17:14", "throughput": 333.06, "total_tokens": 35917376} {"current_steps": 28370, "total_steps": 40000, "loss": 0.0473, "lr": 0.05835278678953985, "epoch": 1.3861920699679966, "percentage": 70.93, "elapsed_time": "1 day, 5:57:23", "remaining_time": "12:16:49", "throughput": 333.11, "total_tokens": 35923648} {"current_steps": 28375, "total_steps": 40000, "loss": 0.0598, "lr": 0.05830616212147874, "epoch": 1.3864363716316908, "percentage": 70.94, "elapsed_time": "1 day, 5:57:26", "remaining_time": "12:16:23", "throughput": 333.16, "total_tokens": 35930048} {"current_steps": 28380, "total_steps": 40000, "loss": 0.0511, "lr": 0.058259551593759784, "epoch": 1.3866806732953851, "percentage": 70.95, "elapsed_time": "1 day, 5:57:29", "remaining_time": "12:15:58", "throughput": 333.21, "total_tokens": 35936096} {"current_steps": 28385, "total_steps": 40000, "loss": 0.0634, "lr": 0.058212955213570804, "epoch": 1.3869249749590795, "percentage": 70.96, "elapsed_time": "1 day, 5:57:32", "remaining_time": "12:15:32", "throughput": 333.25, "total_tokens": 35942432} {"current_steps": 28390, "total_steps": 40000, "loss": 0.0529, "lr": 0.0581663729880976, "epoch": 1.3871692766227737, "percentage": 70.97, "elapsed_time": "1 day, 5:57:35", "remaining_time": "12:15:07", "throughput": 333.3, "total_tokens": 35948352} {"current_steps": 28395, "total_steps": 40000, "loss": 0.0707, "lr": 0.05811980492452379, "epoch": 1.387413578286468, "percentage": 70.99, "elapsed_time": "1 day, 5:57:38", "remaining_time": "12:14:41", "throughput": 333.35, "total_tokens": 35954464} {"current_steps": 28400, "total_steps": 40000, "loss": 0.0615, "lr": 0.058073251030030644, "epoch": 1.3876578799501624, "percentage": 71.0, "elapsed_time": "1 day, 5:57:41", "remaining_time": "12:14:16", "throughput": 333.4, "total_tokens": 35960608} {"current_steps": 28400, "total_steps": 40000, "eval_loss": 0.06265776604413986, "epoch": 1.3876578799501624, "percentage": 71.0, "elapsed_time": "1 day, 6:08:21", "remaining_time": "12:18:37", "throughput": 331.43, "total_tokens": 35960608} {"current_steps": 28405, "total_steps": 40000, "loss": 0.0581, "lr": 0.05802671131179747, "epoch": 1.3879021816138568, "percentage": 71.01, "elapsed_time": "1 day, 6:08:25", "remaining_time": "12:18:12", "throughput": 331.48, "total_tokens": 35966880} {"current_steps": 28410, "total_steps": 40000, "loss": 0.0395, "lr": 0.057980185777001154, "epoch": 1.3881464832775512, "percentage": 71.03, "elapsed_time": "1 day, 6:08:28", "remaining_time": "12:17:46", "throughput": 331.52, "total_tokens": 35973056} {"current_steps": 28415, "total_steps": 40000, "loss": 0.0595, "lr": 0.057933674432816606, "epoch": 1.3883907849412456, "percentage": 71.04, "elapsed_time": "1 day, 6:08:31", "remaining_time": "12:17:20", "throughput": 331.57, "total_tokens": 35979328} {"current_steps": 28420, "total_steps": 40000, "loss": 0.0385, "lr": 0.05788717728641648, "epoch": 1.3886350866049397, "percentage": 71.05, "elapsed_time": "1 day, 6:08:34", "remaining_time": "12:16:55", "throughput": 331.62, "total_tokens": 35985408} {"current_steps": 28425, "total_steps": 40000, "loss": 0.0803, "lr": 0.057840694344971126, "epoch": 1.388879388268634, "percentage": 71.06, "elapsed_time": "1 day, 6:08:37", "remaining_time": "12:16:29", "throughput": 331.67, "total_tokens": 35991552} {"current_steps": 28430, "total_steps": 40000, "loss": 0.0756, "lr": 0.0577942256156489, "epoch": 1.3891236899323285, "percentage": 71.08, "elapsed_time": "1 day, 6:08:40", "remaining_time": "12:16:04", "throughput": 331.72, "total_tokens": 35998208} {"current_steps": 28435, "total_steps": 40000, "loss": 0.0493, "lr": 0.057747771105615804, "epoch": 1.3893679915960226, "percentage": 71.09, "elapsed_time": "1 day, 6:08:43", "remaining_time": "12:15:38", "throughput": 331.76, "total_tokens": 36004096} {"current_steps": 28440, "total_steps": 40000, "loss": 0.0668, "lr": 0.05770133082203568, "epoch": 1.389612293259717, "percentage": 71.1, "elapsed_time": "1 day, 6:08:46", "remaining_time": "12:15:12", "throughput": 331.81, "total_tokens": 36010816} {"current_steps": 28445, "total_steps": 40000, "loss": 0.0941, "lr": 0.0576549047720703, "epoch": 1.3898565949234114, "percentage": 71.11, "elapsed_time": "1 day, 6:08:49", "remaining_time": "12:14:47", "throughput": 331.86, "total_tokens": 36017152} {"current_steps": 28450, "total_steps": 40000, "loss": 0.0397, "lr": 0.05760849296287902, "epoch": 1.3901008965871058, "percentage": 71.12, "elapsed_time": "1 day, 6:08:53", "remaining_time": "12:14:21", "throughput": 331.92, "total_tokens": 36023808} {"current_steps": 28455, "total_steps": 40000, "loss": 0.0545, "lr": 0.05756209540161919, "epoch": 1.3903451982508002, "percentage": 71.14, "elapsed_time": "1 day, 6:08:56", "remaining_time": "12:13:56", "throughput": 331.96, "total_tokens": 36030144} {"current_steps": 28460, "total_steps": 40000, "loss": 0.0522, "lr": 0.05751571209544595, "epoch": 1.3905894999144945, "percentage": 71.15, "elapsed_time": "1 day, 6:08:59", "remaining_time": "12:13:30", "throughput": 332.01, "total_tokens": 36036480} {"current_steps": 28465, "total_steps": 40000, "loss": 0.0283, "lr": 0.057469343051512085, "epoch": 1.3908338015781887, "percentage": 71.16, "elapsed_time": "1 day, 6:09:02", "remaining_time": "12:13:05", "throughput": 332.06, "total_tokens": 36042816} {"current_steps": 28470, "total_steps": 40000, "loss": 0.0672, "lr": 0.057422988276968324, "epoch": 1.391078103241883, "percentage": 71.17, "elapsed_time": "1 day, 6:09:05", "remaining_time": "12:12:39", "throughput": 332.11, "total_tokens": 36048928} {"current_steps": 28475, "total_steps": 40000, "loss": 0.0755, "lr": 0.05737664777896323, "epoch": 1.3913224049055775, "percentage": 71.19, "elapsed_time": "1 day, 6:09:08", "remaining_time": "12:12:14", "throughput": 332.16, "total_tokens": 36055168} {"current_steps": 28480, "total_steps": 40000, "loss": 0.034, "lr": 0.057330321564642975, "epoch": 1.3915667065692716, "percentage": 71.2, "elapsed_time": "1 day, 6:09:11", "remaining_time": "12:11:48", "throughput": 332.21, "total_tokens": 36061792} {"current_steps": 28485, "total_steps": 40000, "loss": 0.1, "lr": 0.05728400964115174, "epoch": 1.391811008232966, "percentage": 71.21, "elapsed_time": "1 day, 6:09:14", "remaining_time": "12:11:23", "throughput": 332.26, "total_tokens": 36068032} {"current_steps": 28490, "total_steps": 40000, "loss": 0.0639, "lr": 0.057237712015631305, "epoch": 1.3920553098966604, "percentage": 71.23, "elapsed_time": "1 day, 6:09:17", "remaining_time": "12:10:57", "throughput": 332.31, "total_tokens": 36074336} {"current_steps": 28495, "total_steps": 40000, "loss": 0.0992, "lr": 0.057191428695221425, "epoch": 1.3922996115603548, "percentage": 71.24, "elapsed_time": "1 day, 6:09:20", "remaining_time": "12:10:32", "throughput": 332.35, "total_tokens": 36080608} {"current_steps": 28500, "total_steps": 40000, "loss": 0.0619, "lr": 0.05714515968705958, "epoch": 1.3925439132240491, "percentage": 71.25, "elapsed_time": "1 day, 6:09:24", "remaining_time": "12:10:06", "throughput": 332.4, "total_tokens": 36087200} {"current_steps": 28505, "total_steps": 40000, "loss": 0.0715, "lr": 0.05709890499828099, "epoch": 1.3927882148877435, "percentage": 71.26, "elapsed_time": "1 day, 6:09:27", "remaining_time": "12:09:41", "throughput": 332.45, "total_tokens": 36093568} {"current_steps": 28510, "total_steps": 40000, "loss": 0.0513, "lr": 0.05705266463601868, "epoch": 1.3930325165514377, "percentage": 71.28, "elapsed_time": "1 day, 6:09:30", "remaining_time": "12:09:15", "throughput": 332.5, "total_tokens": 36099712} {"current_steps": 28515, "total_steps": 40000, "loss": 0.0673, "lr": 0.057006438607403565, "epoch": 1.393276818215132, "percentage": 71.29, "elapsed_time": "1 day, 6:09:33", "remaining_time": "12:08:50", "throughput": 332.55, "total_tokens": 36106176} {"current_steps": 28520, "total_steps": 40000, "loss": 0.0512, "lr": 0.056960226919564205, "epoch": 1.3935211198788264, "percentage": 71.3, "elapsed_time": "1 day, 6:09:36", "remaining_time": "12:08:24", "throughput": 332.6, "total_tokens": 36112576} {"current_steps": 28525, "total_steps": 40000, "loss": 0.0397, "lr": 0.05691402957962713, "epoch": 1.3937654215425206, "percentage": 71.31, "elapsed_time": "1 day, 6:09:39", "remaining_time": "12:07:59", "throughput": 332.65, "total_tokens": 36119008} {"current_steps": 28530, "total_steps": 40000, "loss": 0.0561, "lr": 0.05686784659471642, "epoch": 1.394009723206215, "percentage": 71.33, "elapsed_time": "1 day, 6:09:42", "remaining_time": "12:07:33", "throughput": 332.7, "total_tokens": 36125184} {"current_steps": 28535, "total_steps": 40000, "loss": 0.0511, "lr": 0.056821677971954136, "epoch": 1.3942540248699093, "percentage": 71.34, "elapsed_time": "1 day, 6:09:45", "remaining_time": "12:07:08", "throughput": 332.75, "total_tokens": 36131648} {"current_steps": 28540, "total_steps": 40000, "loss": 0.0704, "lr": 0.05677552371846012, "epoch": 1.3944983265336037, "percentage": 71.35, "elapsed_time": "1 day, 6:09:48", "remaining_time": "12:06:42", "throughput": 332.8, "total_tokens": 36137856} {"current_steps": 28545, "total_steps": 40000, "loss": 0.0663, "lr": 0.05672938384135182, "epoch": 1.394742628197298, "percentage": 71.36, "elapsed_time": "1 day, 6:09:51", "remaining_time": "12:06:17", "throughput": 332.85, "total_tokens": 36144320} {"current_steps": 28550, "total_steps": 40000, "loss": 0.0675, "lr": 0.05668325834774465, "epoch": 1.3949869298609925, "percentage": 71.38, "elapsed_time": "1 day, 6:09:54", "remaining_time": "12:05:52", "throughput": 332.89, "total_tokens": 36150368} {"current_steps": 28555, "total_steps": 40000, "loss": 0.0549, "lr": 0.05663714724475177, "epoch": 1.3952312315246866, "percentage": 71.39, "elapsed_time": "1 day, 6:09:58", "remaining_time": "12:05:26", "throughput": 332.94, "total_tokens": 36156544} {"current_steps": 28560, "total_steps": 40000, "loss": 0.0614, "lr": 0.05659105053948403, "epoch": 1.395475533188381, "percentage": 71.4, "elapsed_time": "1 day, 6:10:01", "remaining_time": "12:05:01", "throughput": 332.99, "total_tokens": 36163136} {"current_steps": 28565, "total_steps": 40000, "loss": 0.0535, "lr": 0.056544968239050176, "epoch": 1.3957198348520754, "percentage": 71.41, "elapsed_time": "1 day, 6:10:04", "remaining_time": "12:04:36", "throughput": 333.05, "total_tokens": 36170304} {"current_steps": 28570, "total_steps": 40000, "loss": 0.0548, "lr": 0.056498900350556616, "epoch": 1.3959641365157696, "percentage": 71.43, "elapsed_time": "1 day, 6:10:07", "remaining_time": "12:04:10", "throughput": 333.09, "total_tokens": 36176448} {"current_steps": 28575, "total_steps": 40000, "loss": 0.07, "lr": 0.05645284688110766, "epoch": 1.396208438179464, "percentage": 71.44, "elapsed_time": "1 day, 6:10:10", "remaining_time": "12:03:45", "throughput": 333.14, "total_tokens": 36182528} {"current_steps": 28580, "total_steps": 40000, "loss": 0.0482, "lr": 0.05640680783780532, "epoch": 1.3964527398431583, "percentage": 71.45, "elapsed_time": "1 day, 6:10:13", "remaining_time": "12:03:19", "throughput": 333.19, "total_tokens": 36189472} {"current_steps": 28585, "total_steps": 40000, "loss": 0.066, "lr": 0.056360783227749324, "epoch": 1.3966970415068527, "percentage": 71.46, "elapsed_time": "1 day, 6:10:16", "remaining_time": "12:02:54", "throughput": 333.24, "total_tokens": 36195680} {"current_steps": 28590, "total_steps": 40000, "loss": 0.0427, "lr": 0.05631477305803728, "epoch": 1.396941343170547, "percentage": 71.47, "elapsed_time": "1 day, 6:10:19", "remaining_time": "12:02:29", "throughput": 333.29, "total_tokens": 36202016} {"current_steps": 28595, "total_steps": 40000, "loss": 0.0571, "lr": 0.05626877733576462, "epoch": 1.3971856448342415, "percentage": 71.49, "elapsed_time": "1 day, 6:10:23", "remaining_time": "12:02:03", "throughput": 333.34, "total_tokens": 36208512} {"current_steps": 28600, "total_steps": 40000, "loss": 0.0507, "lr": 0.05622279606802435, "epoch": 1.3974299464979356, "percentage": 71.5, "elapsed_time": "1 day, 6:10:26", "remaining_time": "12:01:38", "throughput": 333.39, "total_tokens": 36214944} {"current_steps": 28600, "total_steps": 40000, "eval_loss": 0.062125883996486664, "epoch": 1.3974299464979356, "percentage": 71.5, "elapsed_time": "1 day, 6:21:07", "remaining_time": "12:05:54", "throughput": 331.43, "total_tokens": 36214944} {"current_steps": 28605, "total_steps": 40000, "loss": 0.0546, "lr": 0.05617682926190744, "epoch": 1.39767424816163, "percentage": 71.51, "elapsed_time": "1 day, 6:21:11", "remaining_time": "12:05:29", "throughput": 331.48, "total_tokens": 36221216} {"current_steps": 28610, "total_steps": 40000, "loss": 0.0287, "lr": 0.05613087692450248, "epoch": 1.3979185498253244, "percentage": 71.53, "elapsed_time": "1 day, 6:21:14", "remaining_time": "12:05:03", "throughput": 331.53, "total_tokens": 36227616} {"current_steps": 28615, "total_steps": 40000, "loss": 0.0333, "lr": 0.05608493906289592, "epoch": 1.3981628514890185, "percentage": 71.54, "elapsed_time": "1 day, 6:21:17", "remaining_time": "12:04:38", "throughput": 331.57, "total_tokens": 36233600} {"current_steps": 28620, "total_steps": 40000, "loss": 0.049, "lr": 0.05603901568417201, "epoch": 1.398407153152713, "percentage": 71.55, "elapsed_time": "1 day, 6:21:20", "remaining_time": "12:04:12", "throughput": 331.62, "total_tokens": 36239776} {"current_steps": 28625, "total_steps": 40000, "loss": 0.0531, "lr": 0.055993106795412625, "epoch": 1.3986514548164073, "percentage": 71.56, "elapsed_time": "1 day, 6:21:23", "remaining_time": "12:03:47", "throughput": 331.67, "total_tokens": 36245984} {"current_steps": 28630, "total_steps": 40000, "loss": 0.0825, "lr": 0.05594721240369759, "epoch": 1.3988957564801017, "percentage": 71.58, "elapsed_time": "1 day, 6:21:26", "remaining_time": "12:03:21", "throughput": 331.71, "total_tokens": 36252000} {"current_steps": 28635, "total_steps": 40000, "loss": 0.0783, "lr": 0.055901332516104296, "epoch": 1.399140058143796, "percentage": 71.59, "elapsed_time": "1 day, 6:21:29", "remaining_time": "12:02:56", "throughput": 331.76, "total_tokens": 36257952} {"current_steps": 28640, "total_steps": 40000, "loss": 0.0424, "lr": 0.05585546713970804, "epoch": 1.3993843598074902, "percentage": 71.6, "elapsed_time": "1 day, 6:21:32", "remaining_time": "12:02:30", "throughput": 331.81, "total_tokens": 36264192} {"current_steps": 28645, "total_steps": 40000, "loss": 0.1271, "lr": 0.05580961628158189, "epoch": 1.3996286614711846, "percentage": 71.61, "elapsed_time": "1 day, 6:21:35", "remaining_time": "12:02:05", "throughput": 331.86, "total_tokens": 36270528} {"current_steps": 28650, "total_steps": 40000, "loss": 0.0628, "lr": 0.05576377994879659, "epoch": 1.399872963134879, "percentage": 71.62, "elapsed_time": "1 day, 6:21:38", "remaining_time": "12:01:39", "throughput": 331.9, "total_tokens": 36276768} {"current_steps": 28655, "total_steps": 40000, "loss": 0.0733, "lr": 0.05571795814842063, "epoch": 1.4001172647985733, "percentage": 71.64, "elapsed_time": "1 day, 6:21:42", "remaining_time": "12:01:14", "throughput": 331.96, "total_tokens": 36283488} {"current_steps": 28660, "total_steps": 40000, "loss": 0.0688, "lr": 0.05567215088752037, "epoch": 1.4003615664622675, "percentage": 71.65, "elapsed_time": "1 day, 6:21:45", "remaining_time": "12:00:49", "throughput": 332.01, "total_tokens": 36290208} {"current_steps": 28665, "total_steps": 40000, "loss": 0.0562, "lr": 0.05562635817315981, "epoch": 1.4006058681259619, "percentage": 71.66, "elapsed_time": "1 day, 6:21:48", "remaining_time": "12:00:23", "throughput": 332.06, "total_tokens": 36296480} {"current_steps": 28670, "total_steps": 40000, "loss": 0.0812, "lr": 0.05558058001240083, "epoch": 1.4008501697896563, "percentage": 71.67, "elapsed_time": "1 day, 6:21:51", "remaining_time": "11:59:58", "throughput": 332.11, "total_tokens": 36303040} {"current_steps": 28675, "total_steps": 40000, "loss": 0.0497, "lr": 0.055534816412302915, "epoch": 1.4010944714533506, "percentage": 71.69, "elapsed_time": "1 day, 6:21:54", "remaining_time": "11:59:33", "throughput": 332.15, "total_tokens": 36309216} {"current_steps": 28680, "total_steps": 40000, "loss": 0.0467, "lr": 0.055489067379923436, "epoch": 1.401338773117045, "percentage": 71.7, "elapsed_time": "1 day, 6:21:57", "remaining_time": "11:59:07", "throughput": 332.2, "total_tokens": 36315392} {"current_steps": 28685, "total_steps": 40000, "loss": 0.0404, "lr": 0.055443332922317505, "epoch": 1.4015830747807392, "percentage": 71.71, "elapsed_time": "1 day, 6:22:00", "remaining_time": "11:58:42", "throughput": 332.25, "total_tokens": 36321792} {"current_steps": 28690, "total_steps": 40000, "loss": 0.0516, "lr": 0.055397613046537876, "epoch": 1.4018273764444336, "percentage": 71.73, "elapsed_time": "1 day, 6:22:03", "remaining_time": "11:58:16", "throughput": 332.3, "total_tokens": 36328064} {"current_steps": 28695, "total_steps": 40000, "loss": 0.0837, "lr": 0.055351907759635145, "epoch": 1.402071678108128, "percentage": 71.74, "elapsed_time": "1 day, 6:22:06", "remaining_time": "11:57:51", "throughput": 332.35, "total_tokens": 36334496} {"current_steps": 28700, "total_steps": 40000, "loss": 0.0402, "lr": 0.05530621706865772, "epoch": 1.4023159797718223, "percentage": 71.75, "elapsed_time": "1 day, 6:22:09", "remaining_time": "11:57:26", "throughput": 332.4, "total_tokens": 36340800} {"current_steps": 28705, "total_steps": 40000, "loss": 0.0402, "lr": 0.055260540980651564, "epoch": 1.4025602814355165, "percentage": 71.76, "elapsed_time": "1 day, 6:22:12", "remaining_time": "11:57:00", "throughput": 332.44, "total_tokens": 36346720} {"current_steps": 28710, "total_steps": 40000, "loss": 0.0371, "lr": 0.05521487950266062, "epoch": 1.4028045830992109, "percentage": 71.78, "elapsed_time": "1 day, 6:22:15", "remaining_time": "11:56:35", "throughput": 332.49, "total_tokens": 36352704} {"current_steps": 28715, "total_steps": 40000, "loss": 0.0799, "lr": 0.055169232641726344, "epoch": 1.4030488847629052, "percentage": 71.79, "elapsed_time": "1 day, 6:22:18", "remaining_time": "11:56:10", "throughput": 332.53, "total_tokens": 36358944} {"current_steps": 28720, "total_steps": 40000, "loss": 0.0641, "lr": 0.055123600404888166, "epoch": 1.4032931864265996, "percentage": 71.8, "elapsed_time": "1 day, 6:22:21", "remaining_time": "11:55:44", "throughput": 332.58, "total_tokens": 36364704} {"current_steps": 28725, "total_steps": 40000, "loss": 0.0362, "lr": 0.05507798279918309, "epoch": 1.403537488090294, "percentage": 71.81, "elapsed_time": "1 day, 6:22:25", "remaining_time": "11:55:19", "throughput": 332.63, "total_tokens": 36371552} {"current_steps": 28730, "total_steps": 40000, "loss": 0.0367, "lr": 0.0550323798316459, "epoch": 1.4037817897539882, "percentage": 71.83, "elapsed_time": "1 day, 6:22:28", "remaining_time": "11:54:54", "throughput": 332.68, "total_tokens": 36378112} {"current_steps": 28735, "total_steps": 40000, "loss": 0.0487, "lr": 0.05498679150930916, "epoch": 1.4040260914176825, "percentage": 71.84, "elapsed_time": "1 day, 6:22:31", "remaining_time": "11:54:29", "throughput": 332.73, "total_tokens": 36384512} {"current_steps": 28740, "total_steps": 40000, "loss": 0.0493, "lr": 0.05494121783920323, "epoch": 1.404270393081377, "percentage": 71.85, "elapsed_time": "1 day, 6:22:34", "remaining_time": "11:54:03", "throughput": 332.78, "total_tokens": 36391168} {"current_steps": 28745, "total_steps": 40000, "loss": 0.0649, "lr": 0.05489565882835605, "epoch": 1.4045146947450713, "percentage": 71.86, "elapsed_time": "1 day, 6:22:37", "remaining_time": "11:53:38", "throughput": 332.83, "total_tokens": 36397696} {"current_steps": 28750, "total_steps": 40000, "loss": 0.0626, "lr": 0.05485011448379348, "epoch": 1.4047589964087654, "percentage": 71.88, "elapsed_time": "1 day, 6:22:40", "remaining_time": "11:53:13", "throughput": 332.88, "total_tokens": 36403680} {"current_steps": 28755, "total_steps": 40000, "loss": 0.051, "lr": 0.05480458481253893, "epoch": 1.4050032980724598, "percentage": 71.89, "elapsed_time": "1 day, 6:22:43", "remaining_time": "11:52:48", "throughput": 332.93, "total_tokens": 36410368} {"current_steps": 28760, "total_steps": 40000, "loss": 0.0572, "lr": 0.054759069821613715, "epoch": 1.4052475997361542, "percentage": 71.9, "elapsed_time": "1 day, 6:22:46", "remaining_time": "11:52:22", "throughput": 332.98, "total_tokens": 36416672} {"current_steps": 28765, "total_steps": 40000, "loss": 0.0633, "lr": 0.05471356951803683, "epoch": 1.4054919013998486, "percentage": 71.91, "elapsed_time": "1 day, 6:22:49", "remaining_time": "11:51:57", "throughput": 333.02, "total_tokens": 36422784} {"current_steps": 28770, "total_steps": 40000, "loss": 0.0527, "lr": 0.054668083908824945, "epoch": 1.405736203063543, "percentage": 71.92, "elapsed_time": "1 day, 6:22:53", "remaining_time": "11:51:32", "throughput": 333.07, "total_tokens": 36428768} {"current_steps": 28775, "total_steps": 40000, "loss": 0.0722, "lr": 0.054622613000992526, "epoch": 1.4059805047272371, "percentage": 71.94, "elapsed_time": "1 day, 6:22:56", "remaining_time": "11:51:07", "throughput": 333.12, "total_tokens": 36435424} {"current_steps": 28780, "total_steps": 40000, "loss": 0.028, "lr": 0.05457715680155182, "epoch": 1.4062248063909315, "percentage": 71.95, "elapsed_time": "1 day, 6:22:59", "remaining_time": "11:50:41", "throughput": 333.17, "total_tokens": 36441536} {"current_steps": 28785, "total_steps": 40000, "loss": 0.08, "lr": 0.05453171531751265, "epoch": 1.4064691080546259, "percentage": 71.96, "elapsed_time": "1 day, 6:23:02", "remaining_time": "11:50:16", "throughput": 333.21, "total_tokens": 36447776} {"current_steps": 28790, "total_steps": 40000, "loss": 0.0722, "lr": 0.05448628855588276, "epoch": 1.4067134097183203, "percentage": 71.97, "elapsed_time": "1 day, 6:23:05", "remaining_time": "11:49:51", "throughput": 333.26, "total_tokens": 36453760} {"current_steps": 28795, "total_steps": 40000, "loss": 0.0853, "lr": 0.05444087652366746, "epoch": 1.4069577113820144, "percentage": 71.99, "elapsed_time": "1 day, 6:23:08", "remaining_time": "11:49:26", "throughput": 333.31, "total_tokens": 36459872} {"current_steps": 28800, "total_steps": 40000, "loss": 0.0612, "lr": 0.05439547922786984, "epoch": 1.4072020130457088, "percentage": 72.0, "elapsed_time": "1 day, 6:23:11", "remaining_time": "11:49:01", "throughput": 333.36, "total_tokens": 36466336} {"current_steps": 28800, "total_steps": 40000, "eval_loss": 0.06246357411146164, "epoch": 1.4072020130457088, "percentage": 72.0, "elapsed_time": "1 day, 6:33:51", "remaining_time": "11:53:10", "throughput": 331.42, "total_tokens": 36466336} {"current_steps": 28805, "total_steps": 40000, "loss": 0.0569, "lr": 0.0543500966754908, "epoch": 1.4074463147094032, "percentage": 72.01, "elapsed_time": "1 day, 6:33:55", "remaining_time": "11:52:45", "throughput": 331.46, "total_tokens": 36472864} {"current_steps": 28810, "total_steps": 40000, "loss": 0.0677, "lr": 0.05430472887352882, "epoch": 1.4076906163730976, "percentage": 72.02, "elapsed_time": "1 day, 6:33:58", "remaining_time": "11:52:19", "throughput": 331.51, "total_tokens": 36479424} {"current_steps": 28815, "total_steps": 40000, "loss": 0.0505, "lr": 0.05425937582898023, "epoch": 1.407934918036792, "percentage": 72.04, "elapsed_time": "1 day, 6:34:02", "remaining_time": "11:51:54", "throughput": 331.56, "total_tokens": 36485632} {"current_steps": 28820, "total_steps": 40000, "loss": 0.0768, "lr": 0.054214037548839085, "epoch": 1.408179219700486, "percentage": 72.05, "elapsed_time": "1 day, 6:34:05", "remaining_time": "11:51:29", "throughput": 331.61, "total_tokens": 36491584} {"current_steps": 28825, "total_steps": 40000, "loss": 0.0464, "lr": 0.05416871404009703, "epoch": 1.4084235213641805, "percentage": 72.06, "elapsed_time": "1 day, 6:34:08", "remaining_time": "11:51:03", "throughput": 331.66, "total_tokens": 36498176} {"current_steps": 28830, "total_steps": 40000, "loss": 0.0551, "lr": 0.054123405309743605, "epoch": 1.4086678230278749, "percentage": 72.08, "elapsed_time": "1 day, 6:34:11", "remaining_time": "11:50:38", "throughput": 331.7, "total_tokens": 36504416} {"current_steps": 28835, "total_steps": 40000, "loss": 0.0402, "lr": 0.0540781113647659, "epoch": 1.408912124691569, "percentage": 72.09, "elapsed_time": "1 day, 6:34:14", "remaining_time": "11:50:13", "throughput": 331.75, "total_tokens": 36510592} {"current_steps": 28840, "total_steps": 40000, "loss": 0.0687, "lr": 0.054032832212148836, "epoch": 1.4091564263552634, "percentage": 72.1, "elapsed_time": "1 day, 6:34:17", "remaining_time": "11:49:48", "throughput": 331.8, "total_tokens": 36517216} {"current_steps": 28845, "total_steps": 40000, "loss": 0.067, "lr": 0.0539875678588751, "epoch": 1.4094007280189578, "percentage": 72.11, "elapsed_time": "1 day, 6:34:20", "remaining_time": "11:49:22", "throughput": 331.85, "total_tokens": 36523648} {"current_steps": 28850, "total_steps": 40000, "loss": 0.0569, "lr": 0.05394231831192492, "epoch": 1.4096450296826522, "percentage": 72.12, "elapsed_time": "1 day, 6:34:23", "remaining_time": "11:48:57", "throughput": 331.9, "total_tokens": 36529664} {"current_steps": 28855, "total_steps": 40000, "loss": 0.0805, "lr": 0.05389708357827639, "epoch": 1.4098893313463465, "percentage": 72.14, "elapsed_time": "1 day, 6:34:26", "remaining_time": "11:48:32", "throughput": 331.94, "total_tokens": 36536096} {"current_steps": 28860, "total_steps": 40000, "loss": 0.0288, "lr": 0.05385186366490533, "epoch": 1.410133633010041, "percentage": 72.15, "elapsed_time": "1 day, 6:34:29", "remaining_time": "11:48:07", "throughput": 332.0, "total_tokens": 36542816} {"current_steps": 28865, "total_steps": 40000, "loss": 0.0524, "lr": 0.053806658578785166, "epoch": 1.410377934673735, "percentage": 72.16, "elapsed_time": "1 day, 6:34:32", "remaining_time": "11:47:41", "throughput": 332.04, "total_tokens": 36548960} {"current_steps": 28870, "total_steps": 40000, "loss": 0.0611, "lr": 0.05376146832688705, "epoch": 1.4106222363374294, "percentage": 72.17, "elapsed_time": "1 day, 6:34:35", "remaining_time": "11:47:16", "throughput": 332.09, "total_tokens": 36555136} {"current_steps": 28875, "total_steps": 40000, "loss": 0.07, "lr": 0.053716292916179964, "epoch": 1.4108665380011238, "percentage": 72.19, "elapsed_time": "1 day, 6:34:39", "remaining_time": "11:46:51", "throughput": 332.14, "total_tokens": 36561664} {"current_steps": 28880, "total_steps": 40000, "loss": 0.063, "lr": 0.05367113235363045, "epoch": 1.411110839664818, "percentage": 72.2, "elapsed_time": "1 day, 6:34:42", "remaining_time": "11:46:26", "throughput": 332.18, "total_tokens": 36567520} {"current_steps": 28885, "total_steps": 40000, "loss": 0.0407, "lr": 0.05362598664620289, "epoch": 1.4113551413285124, "percentage": 72.21, "elapsed_time": "1 day, 6:34:45", "remaining_time": "11:46:00", "throughput": 332.23, "total_tokens": 36573824} {"current_steps": 28890, "total_steps": 40000, "loss": 0.0679, "lr": 0.053580855800859285, "epoch": 1.4115994429922067, "percentage": 72.22, "elapsed_time": "1 day, 6:34:48", "remaining_time": "11:45:35", "throughput": 332.28, "total_tokens": 36580384} {"current_steps": 28895, "total_steps": 40000, "loss": 0.0518, "lr": 0.05353573982455938, "epoch": 1.4118437446559011, "percentage": 72.24, "elapsed_time": "1 day, 6:34:51", "remaining_time": "11:45:10", "throughput": 332.33, "total_tokens": 36586880} {"current_steps": 28900, "total_steps": 40000, "loss": 0.0436, "lr": 0.053490638724260686, "epoch": 1.4120880463195955, "percentage": 72.25, "elapsed_time": "1 day, 6:34:54", "remaining_time": "11:44:45", "throughput": 332.38, "total_tokens": 36593024} {"current_steps": 28905, "total_steps": 40000, "loss": 0.0594, "lr": 0.05344555250691827, "epoch": 1.4123323479832899, "percentage": 72.26, "elapsed_time": "1 day, 6:34:57", "remaining_time": "11:44:20", "throughput": 332.43, "total_tokens": 36599680} {"current_steps": 28910, "total_steps": 40000, "loss": 0.0716, "lr": 0.053400481179485086, "epoch": 1.412576649646984, "percentage": 72.28, "elapsed_time": "1 day, 6:35:00", "remaining_time": "11:43:55", "throughput": 332.48, "total_tokens": 36605792} {"current_steps": 28915, "total_steps": 40000, "loss": 0.046, "lr": 0.05335542474891159, "epoch": 1.4128209513106784, "percentage": 72.29, "elapsed_time": "1 day, 6:35:03", "remaining_time": "11:43:29", "throughput": 332.53, "total_tokens": 36612448} {"current_steps": 28920, "total_steps": 40000, "loss": 0.0414, "lr": 0.053310383222146124, "epoch": 1.4130652529743728, "percentage": 72.3, "elapsed_time": "1 day, 6:35:06", "remaining_time": "11:43:04", "throughput": 332.57, "total_tokens": 36618656} {"current_steps": 28925, "total_steps": 40000, "loss": 0.0288, "lr": 0.053265356606134684, "epoch": 1.413309554638067, "percentage": 72.31, "elapsed_time": "1 day, 6:35:10", "remaining_time": "11:42:39", "throughput": 332.62, "total_tokens": 36625216} {"current_steps": 28930, "total_steps": 40000, "loss": 0.0613, "lr": 0.053220344907820856, "epoch": 1.4135538563017613, "percentage": 72.32, "elapsed_time": "1 day, 6:35:13", "remaining_time": "11:42:14", "throughput": 332.67, "total_tokens": 36631168} {"current_steps": 28935, "total_steps": 40000, "loss": 0.0738, "lr": 0.05317534813414608, "epoch": 1.4137981579654557, "percentage": 72.34, "elapsed_time": "1 day, 6:35:16", "remaining_time": "11:41:49", "throughput": 332.72, "total_tokens": 36637888} {"current_steps": 28940, "total_steps": 40000, "loss": 0.0697, "lr": 0.05313036629204942, "epoch": 1.41404245962915, "percentage": 72.35, "elapsed_time": "1 day, 6:35:19", "remaining_time": "11:41:24", "throughput": 332.77, "total_tokens": 36643840} {"current_steps": 28945, "total_steps": 40000, "loss": 0.0609, "lr": 0.05308539938846756, "epoch": 1.4142867612928445, "percentage": 72.36, "elapsed_time": "1 day, 6:35:22", "remaining_time": "11:40:59", "throughput": 332.81, "total_tokens": 36650208} {"current_steps": 28950, "total_steps": 40000, "loss": 0.0608, "lr": 0.05304044743033507, "epoch": 1.4145310629565389, "percentage": 72.38, "elapsed_time": "1 day, 6:35:25", "remaining_time": "11:40:34", "throughput": 332.87, "total_tokens": 36657280} {"current_steps": 28955, "total_steps": 40000, "loss": 0.0513, "lr": 0.05299551042458401, "epoch": 1.414775364620233, "percentage": 72.39, "elapsed_time": "1 day, 6:35:28", "remaining_time": "11:40:08", "throughput": 332.91, "total_tokens": 36663136} {"current_steps": 28960, "total_steps": 40000, "loss": 0.0841, "lr": 0.052950588378144266, "epoch": 1.4150196662839274, "percentage": 72.4, "elapsed_time": "1 day, 6:35:31", "remaining_time": "11:39:43", "throughput": 332.96, "total_tokens": 36669408} {"current_steps": 28965, "total_steps": 40000, "loss": 0.0714, "lr": 0.052905681297943465, "epoch": 1.4152639679476218, "percentage": 72.41, "elapsed_time": "1 day, 6:35:34", "remaining_time": "11:39:18", "throughput": 333.01, "total_tokens": 36676096} {"current_steps": 28970, "total_steps": 40000, "loss": 0.0654, "lr": 0.0528607891909067, "epoch": 1.415508269611316, "percentage": 72.42, "elapsed_time": "1 day, 6:35:37", "remaining_time": "11:38:53", "throughput": 333.06, "total_tokens": 36681920} {"current_steps": 28975, "total_steps": 40000, "loss": 0.0535, "lr": 0.05281591206395697, "epoch": 1.4157525712750103, "percentage": 72.44, "elapsed_time": "1 day, 6:35:40", "remaining_time": "11:38:28", "throughput": 333.1, "total_tokens": 36687968} {"current_steps": 28980, "total_steps": 40000, "loss": 0.0478, "lr": 0.05277104992401496, "epoch": 1.4159968729387047, "percentage": 72.45, "elapsed_time": "1 day, 6:35:43", "remaining_time": "11:38:03", "throughput": 333.16, "total_tokens": 36695008} {"current_steps": 28985, "total_steps": 40000, "loss": 0.0568, "lr": 0.05272620277799884, "epoch": 1.416241174602399, "percentage": 72.46, "elapsed_time": "1 day, 6:35:46", "remaining_time": "11:37:38", "throughput": 333.2, "total_tokens": 36701184} {"current_steps": 28990, "total_steps": 40000, "loss": 0.0892, "lr": 0.05268137063282473, "epoch": 1.4164854762660934, "percentage": 72.47, "elapsed_time": "1 day, 6:35:49", "remaining_time": "11:37:13", "throughput": 333.25, "total_tokens": 36707488} {"current_steps": 28995, "total_steps": 40000, "loss": 0.0519, "lr": 0.0526365534954062, "epoch": 1.4167297779297878, "percentage": 72.49, "elapsed_time": "1 day, 6:35:53", "remaining_time": "11:36:48", "throughput": 333.3, "total_tokens": 36713856} {"current_steps": 29000, "total_steps": 40000, "loss": 0.0536, "lr": 0.052591751372654656, "epoch": 1.416974079593482, "percentage": 72.5, "elapsed_time": "1 day, 6:35:56", "remaining_time": "11:36:23", "throughput": 333.35, "total_tokens": 36720160} {"current_steps": 29000, "total_steps": 40000, "eval_loss": 0.06297968327999115, "epoch": 1.416974079593482, "percentage": 72.5, "elapsed_time": "1 day, 6:46:36", "remaining_time": "11:40:26", "throughput": 331.42, "total_tokens": 36720160} {"current_steps": 29005, "total_steps": 40000, "loss": 0.0546, "lr": 0.05254696427147921, "epoch": 1.4172183812571764, "percentage": 72.51, "elapsed_time": "1 day, 6:46:41", "remaining_time": "11:40:01", "throughput": 331.46, "total_tokens": 36726080} {"current_steps": 29010, "total_steps": 40000, "loss": 0.0674, "lr": 0.052502192198786546, "epoch": 1.4174626829208707, "percentage": 72.52, "elapsed_time": "1 day, 6:46:44", "remaining_time": "11:39:36", "throughput": 331.51, "total_tokens": 36732288} {"current_steps": 29015, "total_steps": 40000, "loss": 0.0712, "lr": 0.05245743516148103, "epoch": 1.417706984584565, "percentage": 72.54, "elapsed_time": "1 day, 6:46:47", "remaining_time": "11:39:11", "throughput": 331.56, "total_tokens": 36738816} {"current_steps": 29020, "total_steps": 40000, "loss": 0.0735, "lr": 0.05241269316646486, "epoch": 1.4179512862482593, "percentage": 72.55, "elapsed_time": "1 day, 6:46:50", "remaining_time": "11:38:46", "throughput": 331.6, "total_tokens": 36745056} {"current_steps": 29025, "total_steps": 40000, "loss": 0.0537, "lr": 0.052367966220637725, "epoch": 1.4181955879119537, "percentage": 72.56, "elapsed_time": "1 day, 6:46:53", "remaining_time": "11:38:21", "throughput": 331.65, "total_tokens": 36751552} {"current_steps": 29030, "total_steps": 40000, "loss": 0.0387, "lr": 0.05232325433089716, "epoch": 1.418439889575648, "percentage": 72.58, "elapsed_time": "1 day, 6:46:56", "remaining_time": "11:37:55", "throughput": 331.7, "total_tokens": 36757440} {"current_steps": 29035, "total_steps": 40000, "loss": 0.0567, "lr": 0.052278557504138214, "epoch": 1.4186841912393424, "percentage": 72.59, "elapsed_time": "1 day, 6:46:59", "remaining_time": "11:37:30", "throughput": 331.74, "total_tokens": 36763392} {"current_steps": 29040, "total_steps": 40000, "loss": 0.0653, "lr": 0.05223387574725372, "epoch": 1.4189284929030368, "percentage": 72.6, "elapsed_time": "1 day, 6:47:02", "remaining_time": "11:37:05", "throughput": 331.78, "total_tokens": 36769280} {"current_steps": 29045, "total_steps": 40000, "loss": 0.0565, "lr": 0.05218920906713428, "epoch": 1.419172794566731, "percentage": 72.61, "elapsed_time": "1 day, 6:47:05", "remaining_time": "11:36:40", "throughput": 331.83, "total_tokens": 36775584} {"current_steps": 29050, "total_steps": 40000, "loss": 0.0765, "lr": 0.05214455747066789, "epoch": 1.4194170962304253, "percentage": 72.62, "elapsed_time": "1 day, 6:47:09", "remaining_time": "11:36:15", "throughput": 331.88, "total_tokens": 36782240} {"current_steps": 29055, "total_steps": 40000, "loss": 0.05, "lr": 0.05209992096474048, "epoch": 1.4196613978941197, "percentage": 72.64, "elapsed_time": "1 day, 6:47:12", "remaining_time": "11:35:50", "throughput": 331.93, "total_tokens": 36788576} {"current_steps": 29060, "total_steps": 40000, "loss": 0.0578, "lr": 0.05205529955623559, "epoch": 1.4199056995578139, "percentage": 72.65, "elapsed_time": "1 day, 6:47:15", "remaining_time": "11:35:25", "throughput": 331.98, "total_tokens": 36795008} {"current_steps": 29065, "total_steps": 40000, "loss": 0.0774, "lr": 0.052010693252034314, "epoch": 1.4201500012215083, "percentage": 72.66, "elapsed_time": "1 day, 6:47:18", "remaining_time": "11:35:00", "throughput": 332.02, "total_tokens": 36800960} {"current_steps": 29070, "total_steps": 40000, "loss": 0.0609, "lr": 0.0519661020590156, "epoch": 1.4203943028852026, "percentage": 72.67, "elapsed_time": "1 day, 6:47:21", "remaining_time": "11:34:35", "throughput": 332.07, "total_tokens": 36807328} {"current_steps": 29075, "total_steps": 40000, "loss": 0.0474, "lr": 0.05192152598405586, "epoch": 1.420638604548897, "percentage": 72.69, "elapsed_time": "1 day, 6:47:24", "remaining_time": "11:34:10", "throughput": 332.12, "total_tokens": 36813440} {"current_steps": 29080, "total_steps": 40000, "loss": 0.0629, "lr": 0.05187696503402941, "epoch": 1.4208829062125914, "percentage": 72.7, "elapsed_time": "1 day, 6:47:27", "remaining_time": "11:33:45", "throughput": 332.17, "total_tokens": 36820576} {"current_steps": 29085, "total_steps": 40000, "loss": 0.0828, "lr": 0.05183241921580798, "epoch": 1.4211272078762858, "percentage": 72.71, "elapsed_time": "1 day, 6:47:30", "remaining_time": "11:33:19", "throughput": 332.22, "total_tokens": 36827008} {"current_steps": 29090, "total_steps": 40000, "loss": 0.054, "lr": 0.051787888536261206, "epoch": 1.42137150953998, "percentage": 72.72, "elapsed_time": "1 day, 6:47:33", "remaining_time": "11:32:54", "throughput": 332.27, "total_tokens": 36833216} {"current_steps": 29095, "total_steps": 40000, "loss": 0.062, "lr": 0.051743373002256184, "epoch": 1.4216158112036743, "percentage": 72.74, "elapsed_time": "1 day, 6:47:36", "remaining_time": "11:32:29", "throughput": 332.32, "total_tokens": 36839744} {"current_steps": 29100, "total_steps": 40000, "loss": 0.055, "lr": 0.05169887262065787, "epoch": 1.4218601128673687, "percentage": 72.75, "elapsed_time": "1 day, 6:47:40", "remaining_time": "11:32:04", "throughput": 332.37, "total_tokens": 36846048} {"current_steps": 29105, "total_steps": 40000, "loss": 0.0639, "lr": 0.051654387398328665, "epoch": 1.4221044145310628, "percentage": 72.76, "elapsed_time": "1 day, 6:47:43", "remaining_time": "11:31:39", "throughput": 332.41, "total_tokens": 36852288} {"current_steps": 29110, "total_steps": 40000, "loss": 0.0629, "lr": 0.05160991734212888, "epoch": 1.4223487161947572, "percentage": 72.78, "elapsed_time": "1 day, 6:47:46", "remaining_time": "11:31:14", "throughput": 332.46, "total_tokens": 36858560} {"current_steps": 29115, "total_steps": 40000, "loss": 0.0586, "lr": 0.051565462458916224, "epoch": 1.4225930178584516, "percentage": 72.79, "elapsed_time": "1 day, 6:47:49", "remaining_time": "11:30:49", "throughput": 332.51, "total_tokens": 36864672} {"current_steps": 29120, "total_steps": 40000, "loss": 0.0548, "lr": 0.05152102275554627, "epoch": 1.422837319522146, "percentage": 72.8, "elapsed_time": "1 day, 6:47:52", "remaining_time": "11:30:24", "throughput": 332.55, "total_tokens": 36870976} {"current_steps": 29125, "total_steps": 40000, "loss": 0.0824, "lr": 0.05147659823887222, "epoch": 1.4230816211858404, "percentage": 72.81, "elapsed_time": "1 day, 6:47:55", "remaining_time": "11:29:59", "throughput": 332.6, "total_tokens": 36877312} {"current_steps": 29130, "total_steps": 40000, "loss": 0.0373, "lr": 0.05143218891574479, "epoch": 1.4233259228495347, "percentage": 72.82, "elapsed_time": "1 day, 6:47:58", "remaining_time": "11:29:34", "throughput": 332.65, "total_tokens": 36883520} {"current_steps": 29135, "total_steps": 40000, "loss": 0.0295, "lr": 0.0513877947930125, "epoch": 1.423570224513229, "percentage": 72.84, "elapsed_time": "1 day, 6:48:01", "remaining_time": "11:29:09", "throughput": 332.7, "total_tokens": 36890016} {"current_steps": 29140, "total_steps": 40000, "loss": 0.0557, "lr": 0.051343415877521566, "epoch": 1.4238145261769233, "percentage": 72.85, "elapsed_time": "1 day, 6:48:04", "remaining_time": "11:28:44", "throughput": 332.74, "total_tokens": 36896064} {"current_steps": 29145, "total_steps": 40000, "loss": 0.0424, "lr": 0.051299052176115634, "epoch": 1.4240588278406177, "percentage": 72.86, "elapsed_time": "1 day, 6:48:07", "remaining_time": "11:28:19", "throughput": 332.79, "total_tokens": 36902848} {"current_steps": 29150, "total_steps": 40000, "loss": 0.0371, "lr": 0.051254703695636256, "epoch": 1.4243031295043118, "percentage": 72.88, "elapsed_time": "1 day, 6:48:10", "remaining_time": "11:27:55", "throughput": 332.84, "total_tokens": 36909440} {"current_steps": 29155, "total_steps": 40000, "loss": 0.0453, "lr": 0.05121037044292249, "epoch": 1.4245474311680062, "percentage": 72.89, "elapsed_time": "1 day, 6:48:14", "remaining_time": "11:27:30", "throughput": 332.89, "total_tokens": 36916000} {"current_steps": 29160, "total_steps": 40000, "loss": 0.0437, "lr": 0.05116605242481101, "epoch": 1.4247917328317006, "percentage": 72.9, "elapsed_time": "1 day, 6:48:17", "remaining_time": "11:27:05", "throughput": 332.94, "total_tokens": 36921760} {"current_steps": 29165, "total_steps": 40000, "loss": 0.0503, "lr": 0.05112174964813634, "epoch": 1.425036034495395, "percentage": 72.91, "elapsed_time": "1 day, 6:48:20", "remaining_time": "11:26:40", "throughput": 332.98, "total_tokens": 36928032} {"current_steps": 29170, "total_steps": 40000, "loss": 0.0431, "lr": 0.05107746211973038, "epoch": 1.4252803361590893, "percentage": 72.92, "elapsed_time": "1 day, 6:48:23", "remaining_time": "11:26:15", "throughput": 333.03, "total_tokens": 36934272} {"current_steps": 29175, "total_steps": 40000, "loss": 0.0264, "lr": 0.05103318984642291, "epoch": 1.4255246378227835, "percentage": 72.94, "elapsed_time": "1 day, 6:48:26", "remaining_time": "11:25:50", "throughput": 333.08, "total_tokens": 36940736} {"current_steps": 29180, "total_steps": 40000, "loss": 0.0443, "lr": 0.05098893283504131, "epoch": 1.4257689394864779, "percentage": 72.95, "elapsed_time": "1 day, 6:48:29", "remaining_time": "11:25:25", "throughput": 333.13, "total_tokens": 36946848} {"current_steps": 29185, "total_steps": 40000, "loss": 0.0845, "lr": 0.050944691092410475, "epoch": 1.4260132411501723, "percentage": 72.96, "elapsed_time": "1 day, 6:48:32", "remaining_time": "11:25:00", "throughput": 333.17, "total_tokens": 36952960} {"current_steps": 29190, "total_steps": 40000, "loss": 0.0523, "lr": 0.05090046462535313, "epoch": 1.4262575428138666, "percentage": 72.97, "elapsed_time": "1 day, 6:48:35", "remaining_time": "11:24:35", "throughput": 333.22, "total_tokens": 36959200} {"current_steps": 29195, "total_steps": 40000, "loss": 0.0469, "lr": 0.050856253440689454, "epoch": 1.4265018444775608, "percentage": 72.99, "elapsed_time": "1 day, 6:48:38", "remaining_time": "11:24:10", "throughput": 333.27, "total_tokens": 36965440} {"current_steps": 29200, "total_steps": 40000, "loss": 0.0452, "lr": 0.050812057545237405, "epoch": 1.4267461461412552, "percentage": 73.0, "elapsed_time": "1 day, 6:48:41", "remaining_time": "11:23:45", "throughput": 333.31, "total_tokens": 36971744} {"current_steps": 29200, "total_steps": 40000, "eval_loss": 0.06298601627349854, "epoch": 1.4267461461412552, "percentage": 73.0, "elapsed_time": "1 day, 6:59:22", "remaining_time": "11:27:42", "throughput": 331.4, "total_tokens": 36971744} {"current_steps": 29205, "total_steps": 40000, "loss": 0.0555, "lr": 0.0507678769458126, "epoch": 1.4269904478049495, "percentage": 73.01, "elapsed_time": "1 day, 6:59:26", "remaining_time": "11:27:18", "throughput": 331.44, "total_tokens": 36977952} {"current_steps": 29210, "total_steps": 40000, "loss": 0.0619, "lr": 0.050723711649228155, "epoch": 1.427234749468644, "percentage": 73.02, "elapsed_time": "1 day, 6:59:29", "remaining_time": "11:26:52", "throughput": 331.49, "total_tokens": 36984288} {"current_steps": 29215, "total_steps": 40000, "loss": 0.0743, "lr": 0.05067956166229496, "epoch": 1.4274790511323383, "percentage": 73.04, "elapsed_time": "1 day, 6:59:32", "remaining_time": "11:26:27", "throughput": 331.54, "total_tokens": 36990208} {"current_steps": 29220, "total_steps": 40000, "loss": 0.055, "lr": 0.05063542699182155, "epoch": 1.4277233527960325, "percentage": 73.05, "elapsed_time": "1 day, 6:59:35", "remaining_time": "11:26:02", "throughput": 331.58, "total_tokens": 36996320} {"current_steps": 29225, "total_steps": 40000, "loss": 0.0831, "lr": 0.050591307644613996, "epoch": 1.4279676544597268, "percentage": 73.06, "elapsed_time": "1 day, 6:59:38", "remaining_time": "11:25:37", "throughput": 331.63, "total_tokens": 37003168} {"current_steps": 29230, "total_steps": 40000, "loss": 0.0935, "lr": 0.05054720362747599, "epoch": 1.4282119561234212, "percentage": 73.08, "elapsed_time": "1 day, 6:59:41", "remaining_time": "11:25:12", "throughput": 331.68, "total_tokens": 37009504} {"current_steps": 29235, "total_steps": 40000, "loss": 0.0712, "lr": 0.050503114947209035, "epoch": 1.4284562577871156, "percentage": 73.09, "elapsed_time": "1 day, 6:59:44", "remaining_time": "11:24:47", "throughput": 331.73, "total_tokens": 37015808} {"current_steps": 29240, "total_steps": 40000, "loss": 0.0475, "lr": 0.05045904161061207, "epoch": 1.4287005594508098, "percentage": 73.1, "elapsed_time": "1 day, 6:59:47", "remaining_time": "11:24:23", "throughput": 331.78, "total_tokens": 37022528} {"current_steps": 29245, "total_steps": 40000, "loss": 0.0635, "lr": 0.05041498362448185, "epoch": 1.4289448611145041, "percentage": 73.11, "elapsed_time": "1 day, 6:59:50", "remaining_time": "11:23:58", "throughput": 331.83, "total_tokens": 37028992} {"current_steps": 29250, "total_steps": 40000, "loss": 0.0467, "lr": 0.05037094099561256, "epoch": 1.4291891627781985, "percentage": 73.12, "elapsed_time": "1 day, 6:59:54", "remaining_time": "11:23:33", "throughput": 331.88, "total_tokens": 37035488} {"current_steps": 29255, "total_steps": 40000, "loss": 0.0503, "lr": 0.05032691373079624, "epoch": 1.429433464441893, "percentage": 73.14, "elapsed_time": "1 day, 6:59:57", "remaining_time": "11:23:08", "throughput": 331.93, "total_tokens": 37042336} {"current_steps": 29260, "total_steps": 40000, "loss": 0.0583, "lr": 0.05028290183682234, "epoch": 1.4296777661055873, "percentage": 73.15, "elapsed_time": "1 day, 7:00:00", "remaining_time": "11:22:43", "throughput": 331.97, "total_tokens": 37048320} {"current_steps": 29265, "total_steps": 40000, "loss": 0.0539, "lr": 0.050238905320478096, "epoch": 1.4299220677692814, "percentage": 73.16, "elapsed_time": "1 day, 7:00:03", "remaining_time": "11:22:18", "throughput": 332.02, "total_tokens": 37055040} {"current_steps": 29270, "total_steps": 40000, "loss": 0.0724, "lr": 0.05019492418854838, "epoch": 1.4301663694329758, "percentage": 73.17, "elapsed_time": "1 day, 7:00:06", "remaining_time": "11:21:53", "throughput": 332.07, "total_tokens": 37060960} {"current_steps": 29275, "total_steps": 40000, "loss": 0.0627, "lr": 0.05015095844781554, "epoch": 1.4304106710966702, "percentage": 73.19, "elapsed_time": "1 day, 7:00:09", "remaining_time": "11:21:28", "throughput": 332.12, "total_tokens": 37067584} {"current_steps": 29280, "total_steps": 40000, "loss": 0.0339, "lr": 0.05010700810505968, "epoch": 1.4306549727603646, "percentage": 73.2, "elapsed_time": "1 day, 7:00:12", "remaining_time": "11:21:03", "throughput": 332.16, "total_tokens": 37073472} {"current_steps": 29285, "total_steps": 40000, "loss": 0.0554, "lr": 0.05006307316705856, "epoch": 1.4308992744240587, "percentage": 73.21, "elapsed_time": "1 day, 7:00:15", "remaining_time": "11:20:38", "throughput": 332.21, "total_tokens": 37080096} {"current_steps": 29290, "total_steps": 40000, "loss": 0.0352, "lr": 0.0500191536405874, "epoch": 1.431143576087753, "percentage": 73.22, "elapsed_time": "1 day, 7:00:18", "remaining_time": "11:20:13", "throughput": 332.26, "total_tokens": 37086336} {"current_steps": 29295, "total_steps": 40000, "loss": 0.0569, "lr": 0.04997524953241922, "epoch": 1.4313878777514475, "percentage": 73.24, "elapsed_time": "1 day, 7:00:21", "remaining_time": "11:19:48", "throughput": 332.31, "total_tokens": 37092832} {"current_steps": 29300, "total_steps": 40000, "loss": 0.0436, "lr": 0.049931360849324556, "epoch": 1.4316321794151419, "percentage": 73.25, "elapsed_time": "1 day, 7:00:24", "remaining_time": "11:19:24", "throughput": 332.35, "total_tokens": 37098560} {"current_steps": 29305, "total_steps": 40000, "loss": 0.0417, "lr": 0.04988748759807155, "epoch": 1.4318764810788362, "percentage": 73.26, "elapsed_time": "1 day, 7:00:27", "remaining_time": "11:18:59", "throughput": 332.4, "total_tokens": 37104960} {"current_steps": 29310, "total_steps": 40000, "loss": 0.086, "lr": 0.0498436297854261, "epoch": 1.4321207827425304, "percentage": 73.28, "elapsed_time": "1 day, 7:00:30", "remaining_time": "11:18:34", "throughput": 332.44, "total_tokens": 37111072} {"current_steps": 29315, "total_steps": 40000, "loss": 0.0734, "lr": 0.04979978741815152, "epoch": 1.4323650844062248, "percentage": 73.29, "elapsed_time": "1 day, 7:00:34", "remaining_time": "11:18:09", "throughput": 332.49, "total_tokens": 37117504} {"current_steps": 29320, "total_steps": 40000, "loss": 0.0663, "lr": 0.04975596050300891, "epoch": 1.4326093860699192, "percentage": 73.3, "elapsed_time": "1 day, 7:00:37", "remaining_time": "11:17:44", "throughput": 332.54, "total_tokens": 37123904} {"current_steps": 29325, "total_steps": 40000, "loss": 0.042, "lr": 0.049712149046757005, "epoch": 1.4328536877336135, "percentage": 73.31, "elapsed_time": "1 day, 7:00:40", "remaining_time": "11:17:19", "throughput": 332.59, "total_tokens": 37129952} {"current_steps": 29330, "total_steps": 40000, "loss": 0.0561, "lr": 0.04966835305615194, "epoch": 1.4330979893973077, "percentage": 73.32, "elapsed_time": "1 day, 7:00:43", "remaining_time": "11:16:54", "throughput": 332.63, "total_tokens": 37136224} {"current_steps": 29335, "total_steps": 40000, "loss": 0.0793, "lr": 0.049624572537947755, "epoch": 1.433342291061002, "percentage": 73.34, "elapsed_time": "1 day, 7:00:46", "remaining_time": "11:16:30", "throughput": 332.68, "total_tokens": 37142656} {"current_steps": 29340, "total_steps": 40000, "loss": 0.0575, "lr": 0.04958080749889582, "epoch": 1.4335865927246965, "percentage": 73.35, "elapsed_time": "1 day, 7:00:49", "remaining_time": "11:16:05", "throughput": 332.73, "total_tokens": 37148960} {"current_steps": 29345, "total_steps": 40000, "loss": 0.0516, "lr": 0.049537057945745304, "epoch": 1.4338308943883908, "percentage": 73.36, "elapsed_time": "1 day, 7:00:52", "remaining_time": "11:15:40", "throughput": 332.78, "total_tokens": 37155360} {"current_steps": 29350, "total_steps": 40000, "loss": 0.0745, "lr": 0.049493323885243, "epoch": 1.4340751960520852, "percentage": 73.38, "elapsed_time": "1 day, 7:00:55", "remaining_time": "11:15:15", "throughput": 332.82, "total_tokens": 37161728} {"current_steps": 29355, "total_steps": 40000, "loss": 0.0295, "lr": 0.04944960532413318, "epoch": 1.4343194977157794, "percentage": 73.39, "elapsed_time": "1 day, 7:00:58", "remaining_time": "11:14:50", "throughput": 332.87, "total_tokens": 37167872} {"current_steps": 29360, "total_steps": 40000, "loss": 0.0375, "lr": 0.049405902269157774, "epoch": 1.4345637993794738, "percentage": 73.4, "elapsed_time": "1 day, 7:01:01", "remaining_time": "11:14:26", "throughput": 332.92, "total_tokens": 37174208} {"current_steps": 29365, "total_steps": 40000, "loss": 0.0541, "lr": 0.04936221472705646, "epoch": 1.4348081010431681, "percentage": 73.41, "elapsed_time": "1 day, 7:01:05", "remaining_time": "11:14:01", "throughput": 332.98, "total_tokens": 37182240} {"current_steps": 29370, "total_steps": 40000, "loss": 0.0359, "lr": 0.04931854270456632, "epoch": 1.4350524027068623, "percentage": 73.42, "elapsed_time": "1 day, 7:01:08", "remaining_time": "11:13:36", "throughput": 333.03, "total_tokens": 37188352} {"current_steps": 29375, "total_steps": 40000, "loss": 0.0592, "lr": 0.049274886208422075, "epoch": 1.4352967043705567, "percentage": 73.44, "elapsed_time": "1 day, 7:01:11", "remaining_time": "11:13:11", "throughput": 333.07, "total_tokens": 37194784} {"current_steps": 29380, "total_steps": 40000, "loss": 0.0436, "lr": 0.049231245245356235, "epoch": 1.435541006034251, "percentage": 73.45, "elapsed_time": "1 day, 7:01:14", "remaining_time": "11:12:47", "throughput": 333.12, "total_tokens": 37201024} {"current_steps": 29385, "total_steps": 40000, "loss": 0.053, "lr": 0.049187619822098655, "epoch": 1.4357853076979454, "percentage": 73.46, "elapsed_time": "1 day, 7:01:17", "remaining_time": "11:12:22", "throughput": 333.17, "total_tokens": 37207264} {"current_steps": 29390, "total_steps": 40000, "loss": 0.0396, "lr": 0.04914400994537705, "epoch": 1.4360296093616398, "percentage": 73.47, "elapsed_time": "1 day, 7:01:20", "remaining_time": "11:11:57", "throughput": 333.22, "total_tokens": 37213824} {"current_steps": 29395, "total_steps": 40000, "loss": 0.054, "lr": 0.049100415621916485, "epoch": 1.4362739110253342, "percentage": 73.49, "elapsed_time": "1 day, 7:01:23", "remaining_time": "11:11:32", "throughput": 333.26, "total_tokens": 37220000} {"current_steps": 29400, "total_steps": 40000, "loss": 0.0515, "lr": 0.04905683685843981, "epoch": 1.4365182126890284, "percentage": 73.5, "elapsed_time": "1 day, 7:01:26", "remaining_time": "11:11:08", "throughput": 333.31, "total_tokens": 37226208} {"current_steps": 29400, "total_steps": 40000, "eval_loss": 0.06252748519182205, "epoch": 1.4365182126890284, "percentage": 73.5, "elapsed_time": "1 day, 7:12:07", "remaining_time": "11:14:58", "throughput": 331.41, "total_tokens": 37226208} {"current_steps": 29405, "total_steps": 40000, "loss": 0.0455, "lr": 0.049013273661667495, "epoch": 1.4367625143527227, "percentage": 73.51, "elapsed_time": "1 day, 7:12:10", "remaining_time": "11:14:34", "throughput": 331.45, "total_tokens": 37232480} {"current_steps": 29410, "total_steps": 40000, "loss": 0.0477, "lr": 0.048969726038317396, "epoch": 1.437006816016417, "percentage": 73.52, "elapsed_time": "1 day, 7:12:14", "remaining_time": "11:14:09", "throughput": 331.5, "total_tokens": 37239328} {"current_steps": 29415, "total_steps": 40000, "loss": 0.0737, "lr": 0.048926193995105206, "epoch": 1.4372511176801113, "percentage": 73.54, "elapsed_time": "1 day, 7:12:17", "remaining_time": "11:13:44", "throughput": 331.55, "total_tokens": 37244992} {"current_steps": 29420, "total_steps": 40000, "loss": 0.0697, "lr": 0.048882677538744035, "epoch": 1.4374954193438056, "percentage": 73.55, "elapsed_time": "1 day, 7:12:20", "remaining_time": "11:13:19", "throughput": 331.59, "total_tokens": 37251136} {"current_steps": 29425, "total_steps": 40000, "loss": 0.0374, "lr": 0.048839176675944715, "epoch": 1.4377397210075, "percentage": 73.56, "elapsed_time": "1 day, 7:12:23", "remaining_time": "11:12:54", "throughput": 331.64, "total_tokens": 37257728} {"current_steps": 29430, "total_steps": 40000, "loss": 0.0487, "lr": 0.04879569141341566, "epoch": 1.4379840226711944, "percentage": 73.58, "elapsed_time": "1 day, 7:12:26", "remaining_time": "11:12:30", "throughput": 331.69, "total_tokens": 37264000} {"current_steps": 29435, "total_steps": 40000, "loss": 0.0725, "lr": 0.04875222175786274, "epoch": 1.4382283243348888, "percentage": 73.59, "elapsed_time": "1 day, 7:12:29", "remaining_time": "11:12:05", "throughput": 331.73, "total_tokens": 37269888} {"current_steps": 29440, "total_steps": 40000, "loss": 0.0523, "lr": 0.04870876771598966, "epoch": 1.4384726259985832, "percentage": 73.6, "elapsed_time": "1 day, 7:12:32", "remaining_time": "11:11:40", "throughput": 331.78, "total_tokens": 37276416} {"current_steps": 29445, "total_steps": 40000, "loss": 0.0263, "lr": 0.04866532929449744, "epoch": 1.4387169276622773, "percentage": 73.61, "elapsed_time": "1 day, 7:12:35", "remaining_time": "11:11:15", "throughput": 331.83, "total_tokens": 37283488} {"current_steps": 29450, "total_steps": 40000, "loss": 0.0651, "lr": 0.048621906500084945, "epoch": 1.4389612293259717, "percentage": 73.62, "elapsed_time": "1 day, 7:12:38", "remaining_time": "11:10:50", "throughput": 331.88, "total_tokens": 37289792} {"current_steps": 29455, "total_steps": 40000, "loss": 0.0408, "lr": 0.04857849933944845, "epoch": 1.439205530989666, "percentage": 73.64, "elapsed_time": "1 day, 7:12:41", "remaining_time": "11:10:25", "throughput": 331.93, "total_tokens": 37295808} {"current_steps": 29460, "total_steps": 40000, "loss": 0.0639, "lr": 0.048535107819281866, "epoch": 1.4394498326533602, "percentage": 73.65, "elapsed_time": "1 day, 7:12:44", "remaining_time": "11:10:01", "throughput": 331.97, "total_tokens": 37302272} {"current_steps": 29465, "total_steps": 40000, "loss": 0.0423, "lr": 0.04849173194627675, "epoch": 1.4396941343170546, "percentage": 73.66, "elapsed_time": "1 day, 7:12:48", "remaining_time": "11:09:36", "throughput": 332.02, "total_tokens": 37308960} {"current_steps": 29470, "total_steps": 40000, "loss": 0.0464, "lr": 0.04844837172712223, "epoch": 1.439938435980749, "percentage": 73.67, "elapsed_time": "1 day, 7:12:51", "remaining_time": "11:09:11", "throughput": 332.07, "total_tokens": 37315552} {"current_steps": 29475, "total_steps": 40000, "loss": 0.0354, "lr": 0.04840502716850494, "epoch": 1.4401827376444434, "percentage": 73.69, "elapsed_time": "1 day, 7:12:54", "remaining_time": "11:08:46", "throughput": 332.12, "total_tokens": 37322080} {"current_steps": 29480, "total_steps": 40000, "loss": 0.0546, "lr": 0.04836169827710916, "epoch": 1.4404270393081378, "percentage": 73.7, "elapsed_time": "1 day, 7:12:57", "remaining_time": "11:08:22", "throughput": 332.17, "total_tokens": 37328064} {"current_steps": 29485, "total_steps": 40000, "loss": 0.0461, "lr": 0.04831838505961684, "epoch": 1.4406713409718321, "percentage": 73.71, "elapsed_time": "1 day, 7:13:00", "remaining_time": "11:07:57", "throughput": 332.21, "total_tokens": 37334304} {"current_steps": 29490, "total_steps": 40000, "loss": 0.059, "lr": 0.048275087522707295, "epoch": 1.4409156426355263, "percentage": 73.72, "elapsed_time": "1 day, 7:13:03", "remaining_time": "11:07:32", "throughput": 332.26, "total_tokens": 37341024} {"current_steps": 29495, "total_steps": 40000, "loss": 0.0363, "lr": 0.04823180567305766, "epoch": 1.4411599442992207, "percentage": 73.74, "elapsed_time": "1 day, 7:13:06", "remaining_time": "11:07:07", "throughput": 332.32, "total_tokens": 37348064} {"current_steps": 29500, "total_steps": 40000, "loss": 0.0642, "lr": 0.04818853951734244, "epoch": 1.441404245962915, "percentage": 73.75, "elapsed_time": "1 day, 7:13:10", "remaining_time": "11:06:43", "throughput": 332.37, "total_tokens": 37354528} {"current_steps": 29505, "total_steps": 40000, "loss": 0.0678, "lr": 0.04814528906223387, "epoch": 1.4416485476266092, "percentage": 73.76, "elapsed_time": "1 day, 7:13:13", "remaining_time": "11:06:18", "throughput": 332.41, "total_tokens": 37360384} {"current_steps": 29510, "total_steps": 40000, "loss": 0.0285, "lr": 0.04810205431440177, "epoch": 1.4418928492903036, "percentage": 73.78, "elapsed_time": "1 day, 7:13:16", "remaining_time": "11:05:53", "throughput": 332.45, "total_tokens": 37366496} {"current_steps": 29515, "total_steps": 40000, "loss": 0.0544, "lr": 0.04805883528051341, "epoch": 1.442137150953998, "percentage": 73.79, "elapsed_time": "1 day, 7:13:19", "remaining_time": "11:05:29", "throughput": 332.5, "total_tokens": 37372544} {"current_steps": 29520, "total_steps": 40000, "loss": 0.0492, "lr": 0.048015631967233685, "epoch": 1.4423814526176924, "percentage": 73.8, "elapsed_time": "1 day, 7:13:22", "remaining_time": "11:05:04", "throughput": 332.55, "total_tokens": 37379104} {"current_steps": 29525, "total_steps": 40000, "loss": 0.0905, "lr": 0.04797244438122517, "epoch": 1.4426257542813867, "percentage": 73.81, "elapsed_time": "1 day, 7:13:25", "remaining_time": "11:04:39", "throughput": 332.59, "total_tokens": 37385376} {"current_steps": 29530, "total_steps": 40000, "loss": 0.0545, "lr": 0.04792927252914784, "epoch": 1.442870055945081, "percentage": 73.83, "elapsed_time": "1 day, 7:13:28", "remaining_time": "11:04:14", "throughput": 332.64, "total_tokens": 37391616} {"current_steps": 29535, "total_steps": 40000, "loss": 0.0692, "lr": 0.04788611641765944, "epoch": 1.4431143576087753, "percentage": 73.84, "elapsed_time": "1 day, 7:13:31", "remaining_time": "11:03:50", "throughput": 332.69, "total_tokens": 37397696} {"current_steps": 29540, "total_steps": 40000, "loss": 0.0649, "lr": 0.04784297605341508, "epoch": 1.4433586592724696, "percentage": 73.85, "elapsed_time": "1 day, 7:13:34", "remaining_time": "11:03:25", "throughput": 332.73, "total_tokens": 37404224} {"current_steps": 29545, "total_steps": 40000, "loss": 0.039, "lr": 0.04779985144306761, "epoch": 1.443602960936164, "percentage": 73.86, "elapsed_time": "1 day, 7:13:37", "remaining_time": "11:03:00", "throughput": 332.78, "total_tokens": 37410400} {"current_steps": 29550, "total_steps": 40000, "loss": 0.0618, "lr": 0.047756742593267405, "epoch": 1.4438472625998582, "percentage": 73.88, "elapsed_time": "1 day, 7:13:40", "remaining_time": "11:02:36", "throughput": 332.82, "total_tokens": 37416320} {"current_steps": 29555, "total_steps": 40000, "loss": 0.04, "lr": 0.047713649510662315, "epoch": 1.4440915642635526, "percentage": 73.89, "elapsed_time": "1 day, 7:13:43", "remaining_time": "11:02:11", "throughput": 332.87, "total_tokens": 37422848} {"current_steps": 29560, "total_steps": 40000, "loss": 0.0544, "lr": 0.04767057220189789, "epoch": 1.444335865927247, "percentage": 73.9, "elapsed_time": "1 day, 7:13:46", "remaining_time": "11:01:46", "throughput": 332.92, "total_tokens": 37428512} {"current_steps": 29565, "total_steps": 40000, "loss": 0.0366, "lr": 0.04762751067361722, "epoch": 1.4445801675909413, "percentage": 73.91, "elapsed_time": "1 day, 7:13:49", "remaining_time": "11:01:22", "throughput": 332.96, "total_tokens": 37434784} {"current_steps": 29570, "total_steps": 40000, "loss": 0.0688, "lr": 0.04758446493246086, "epoch": 1.4448244692546357, "percentage": 73.92, "elapsed_time": "1 day, 7:13:52", "remaining_time": "11:00:57", "throughput": 333.01, "total_tokens": 37441120} {"current_steps": 29575, "total_steps": 40000, "loss": 0.0771, "lr": 0.047541434985067084, "epoch": 1.44506877091833, "percentage": 73.94, "elapsed_time": "1 day, 7:13:55", "remaining_time": "11:00:32", "throughput": 333.05, "total_tokens": 37446816} {"current_steps": 29580, "total_steps": 40000, "loss": 0.0453, "lr": 0.047498420838071556, "epoch": 1.4453130725820242, "percentage": 73.95, "elapsed_time": "1 day, 7:13:58", "remaining_time": "11:00:08", "throughput": 333.1, "total_tokens": 37453088} {"current_steps": 29585, "total_steps": 40000, "loss": 0.0553, "lr": 0.04745542249810772, "epoch": 1.4455573742457186, "percentage": 73.96, "elapsed_time": "1 day, 7:14:01", "remaining_time": "10:59:43", "throughput": 333.14, "total_tokens": 37459392} {"current_steps": 29590, "total_steps": 40000, "loss": 0.0542, "lr": 0.047412439971806324, "epoch": 1.445801675909413, "percentage": 73.98, "elapsed_time": "1 day, 7:14:04", "remaining_time": "10:59:19", "throughput": 333.19, "total_tokens": 37465568} {"current_steps": 29595, "total_steps": 40000, "loss": 0.0708, "lr": 0.04736947326579592, "epoch": 1.4460459775731072, "percentage": 73.99, "elapsed_time": "1 day, 7:14:08", "remaining_time": "10:58:54", "throughput": 333.24, "total_tokens": 37471840} {"current_steps": 29600, "total_steps": 40000, "loss": 0.0451, "lr": 0.04732652238670245, "epoch": 1.4462902792368015, "percentage": 74.0, "elapsed_time": "1 day, 7:14:11", "remaining_time": "10:58:29", "throughput": 333.29, "total_tokens": 37479008} {"current_steps": 29600, "total_steps": 40000, "eval_loss": 0.06261797249317169, "epoch": 1.4462902792368015, "percentage": 74.0, "elapsed_time": "1 day, 7:24:52", "remaining_time": "11:02:15", "throughput": 331.4, "total_tokens": 37479008} {"current_steps": 29605, "total_steps": 40000, "loss": 0.0362, "lr": 0.04728358734114952, "epoch": 1.446534580900496, "percentage": 74.01, "elapsed_time": "1 day, 7:24:56", "remaining_time": "11:01:50", "throughput": 331.44, "total_tokens": 37485088} {"current_steps": 29610, "total_steps": 40000, "loss": 0.0893, "lr": 0.04724066813575821, "epoch": 1.4467788825641903, "percentage": 74.02, "elapsed_time": "1 day, 7:24:59", "remaining_time": "11:01:26", "throughput": 331.49, "total_tokens": 37491584} {"current_steps": 29615, "total_steps": 40000, "loss": 0.0698, "lr": 0.04719776477714729, "epoch": 1.4470231842278847, "percentage": 74.04, "elapsed_time": "1 day, 7:25:02", "remaining_time": "11:01:01", "throughput": 331.54, "total_tokens": 37497920} {"current_steps": 29620, "total_steps": 40000, "loss": 0.0498, "lr": 0.047154877271932856, "epoch": 1.447267485891579, "percentage": 74.05, "elapsed_time": "1 day, 7:25:05", "remaining_time": "11:00:36", "throughput": 331.59, "total_tokens": 37504992} {"current_steps": 29625, "total_steps": 40000, "loss": 0.0815, "lr": 0.0471120056267288, "epoch": 1.4475117875552732, "percentage": 74.06, "elapsed_time": "1 day, 7:25:08", "remaining_time": "11:00:12", "throughput": 331.64, "total_tokens": 37511776} {"current_steps": 29630, "total_steps": 40000, "loss": 0.1175, "lr": 0.047069149848146495, "epoch": 1.4477560892189676, "percentage": 74.08, "elapsed_time": "1 day, 7:25:12", "remaining_time": "10:59:47", "throughput": 331.69, "total_tokens": 37517760} {"current_steps": 29635, "total_steps": 40000, "loss": 0.0424, "lr": 0.04702630994279473, "epoch": 1.448000390882662, "percentage": 74.09, "elapsed_time": "1 day, 7:25:15", "remaining_time": "10:59:22", "throughput": 331.73, "total_tokens": 37523872} {"current_steps": 29640, "total_steps": 40000, "loss": 0.0432, "lr": 0.046983485917280035, "epoch": 1.4482446925463561, "percentage": 74.1, "elapsed_time": "1 day, 7:25:18", "remaining_time": "10:58:57", "throughput": 331.78, "total_tokens": 37530240} {"current_steps": 29645, "total_steps": 40000, "loss": 0.0751, "lr": 0.04694067777820644, "epoch": 1.4484889942100505, "percentage": 74.11, "elapsed_time": "1 day, 7:25:21", "remaining_time": "10:58:33", "throughput": 331.83, "total_tokens": 37536448} {"current_steps": 29650, "total_steps": 40000, "loss": 0.0799, "lr": 0.046897885532175415, "epoch": 1.4487332958737449, "percentage": 74.12, "elapsed_time": "1 day, 7:25:24", "remaining_time": "10:58:08", "throughput": 331.87, "total_tokens": 37542400} {"current_steps": 29655, "total_steps": 40000, "loss": 0.0518, "lr": 0.04685510918578613, "epoch": 1.4489775975374393, "percentage": 74.14, "elapsed_time": "1 day, 7:25:27", "remaining_time": "10:57:43", "throughput": 331.91, "total_tokens": 37548608} {"current_steps": 29660, "total_steps": 40000, "loss": 0.0573, "lr": 0.04681234874563519, "epoch": 1.4492218992011336, "percentage": 74.15, "elapsed_time": "1 day, 7:25:30", "remaining_time": "10:57:19", "throughput": 331.96, "total_tokens": 37555072} {"current_steps": 29665, "total_steps": 40000, "loss": 0.0634, "lr": 0.046769604218316836, "epoch": 1.449466200864828, "percentage": 74.16, "elapsed_time": "1 day, 7:25:33", "remaining_time": "10:56:54", "throughput": 332.01, "total_tokens": 37561344} {"current_steps": 29670, "total_steps": 40000, "loss": 0.0559, "lr": 0.04672687561042279, "epoch": 1.4497105025285222, "percentage": 74.17, "elapsed_time": "1 day, 7:25:36", "remaining_time": "10:56:29", "throughput": 332.06, "total_tokens": 37567616} {"current_steps": 29675, "total_steps": 40000, "loss": 0.0559, "lr": 0.046684162928542286, "epoch": 1.4499548041922166, "percentage": 74.19, "elapsed_time": "1 day, 7:25:39", "remaining_time": "10:56:05", "throughput": 332.1, "total_tokens": 37574048} {"current_steps": 29680, "total_steps": 40000, "loss": 0.053, "lr": 0.04664146617926222, "epoch": 1.450199105855911, "percentage": 74.2, "elapsed_time": "1 day, 7:25:42", "remaining_time": "10:55:40", "throughput": 332.15, "total_tokens": 37579872} {"current_steps": 29685, "total_steps": 40000, "loss": 0.0621, "lr": 0.046598785369167, "epoch": 1.450443407519605, "percentage": 74.21, "elapsed_time": "1 day, 7:25:45", "remaining_time": "10:55:16", "throughput": 332.19, "total_tokens": 37586080} {"current_steps": 29690, "total_steps": 40000, "loss": 0.0411, "lr": 0.046556120504838434, "epoch": 1.4506877091832995, "percentage": 74.22, "elapsed_time": "1 day, 7:25:48", "remaining_time": "10:54:51", "throughput": 332.23, "total_tokens": 37591904} {"current_steps": 29695, "total_steps": 40000, "loss": 0.0584, "lr": 0.04651347159285609, "epoch": 1.4509320108469939, "percentage": 74.24, "elapsed_time": "1 day, 7:25:51", "remaining_time": "10:54:26", "throughput": 332.28, "total_tokens": 37598400} {"current_steps": 29700, "total_steps": 40000, "loss": 0.0566, "lr": 0.04647083863979688, "epoch": 1.4511763125106882, "percentage": 74.25, "elapsed_time": "1 day, 7:25:54", "remaining_time": "10:54:02", "throughput": 332.33, "total_tokens": 37604512} {"current_steps": 29705, "total_steps": 40000, "loss": 0.068, "lr": 0.04642822165223538, "epoch": 1.4514206141743826, "percentage": 74.26, "elapsed_time": "1 day, 7:25:58", "remaining_time": "10:53:37", "throughput": 332.37, "total_tokens": 37610624} {"current_steps": 29710, "total_steps": 40000, "loss": 0.0569, "lr": 0.046385620636743716, "epoch": 1.4516649158380768, "percentage": 74.28, "elapsed_time": "1 day, 7:26:01", "remaining_time": "10:53:13", "throughput": 332.42, "total_tokens": 37617408} {"current_steps": 29715, "total_steps": 40000, "loss": 0.0563, "lr": 0.04634303559989141, "epoch": 1.4519092175017712, "percentage": 74.29, "elapsed_time": "1 day, 7:26:04", "remaining_time": "10:52:48", "throughput": 332.47, "total_tokens": 37623744} {"current_steps": 29720, "total_steps": 40000, "loss": 0.0481, "lr": 0.046300466548245635, "epoch": 1.4521535191654655, "percentage": 74.3, "elapsed_time": "1 day, 7:26:07", "remaining_time": "10:52:24", "throughput": 332.52, "total_tokens": 37630528} {"current_steps": 29725, "total_steps": 40000, "loss": 0.0407, "lr": 0.04625791348837114, "epoch": 1.45239782082916, "percentage": 74.31, "elapsed_time": "1 day, 7:26:10", "remaining_time": "10:51:59", "throughput": 332.57, "total_tokens": 37636768} {"current_steps": 29730, "total_steps": 40000, "loss": 0.0672, "lr": 0.046215376426830095, "epoch": 1.452642122492854, "percentage": 74.33, "elapsed_time": "1 day, 7:26:13", "remaining_time": "10:51:35", "throughput": 332.62, "total_tokens": 37643680} {"current_steps": 29735, "total_steps": 40000, "loss": 0.0565, "lr": 0.04617285537018219, "epoch": 1.4528864241565485, "percentage": 74.34, "elapsed_time": "1 day, 7:26:16", "remaining_time": "10:51:10", "throughput": 332.67, "total_tokens": 37650080} {"current_steps": 29740, "total_steps": 40000, "loss": 0.0652, "lr": 0.046130350324984803, "epoch": 1.4531307258202428, "percentage": 74.35, "elapsed_time": "1 day, 7:26:19", "remaining_time": "10:50:45", "throughput": 332.71, "total_tokens": 37656192} {"current_steps": 29745, "total_steps": 40000, "loss": 0.0558, "lr": 0.046087861297792666, "epoch": 1.4533750274839372, "percentage": 74.36, "elapsed_time": "1 day, 7:26:23", "remaining_time": "10:50:21", "throughput": 332.76, "total_tokens": 37662560} {"current_steps": 29750, "total_steps": 40000, "loss": 0.0396, "lr": 0.0460453882951582, "epoch": 1.4536193291476316, "percentage": 74.38, "elapsed_time": "1 day, 7:26:26", "remaining_time": "10:49:56", "throughput": 332.81, "total_tokens": 37669056} {"current_steps": 29755, "total_steps": 40000, "loss": 0.0473, "lr": 0.04600293132363119, "epoch": 1.4538636308113257, "percentage": 74.39, "elapsed_time": "1 day, 7:26:29", "remaining_time": "10:49:32", "throughput": 332.85, "total_tokens": 37675200} {"current_steps": 29760, "total_steps": 40000, "loss": 0.045, "lr": 0.045960490389759086, "epoch": 1.4541079324750201, "percentage": 74.4, "elapsed_time": "1 day, 7:26:32", "remaining_time": "10:49:07", "throughput": 332.9, "total_tokens": 37681600} {"current_steps": 29765, "total_steps": 40000, "loss": 0.0824, "lr": 0.04591806550008685, "epoch": 1.4543522341387145, "percentage": 74.41, "elapsed_time": "1 day, 7:26:35", "remaining_time": "10:48:43", "throughput": 332.94, "total_tokens": 37687648} {"current_steps": 29770, "total_steps": 40000, "loss": 0.0658, "lr": 0.045875656661156825, "epoch": 1.4545965358024089, "percentage": 74.42, "elapsed_time": "1 day, 7:26:38", "remaining_time": "10:48:18", "throughput": 332.99, "total_tokens": 37693632} {"current_steps": 29775, "total_steps": 40000, "loss": 0.053, "lr": 0.04583326387950911, "epoch": 1.454840837466103, "percentage": 74.44, "elapsed_time": "1 day, 7:26:41", "remaining_time": "10:47:54", "throughput": 333.03, "total_tokens": 37699712} {"current_steps": 29780, "total_steps": 40000, "loss": 0.0405, "lr": 0.0457908871616811, "epoch": 1.4550851391297974, "percentage": 74.45, "elapsed_time": "1 day, 7:26:44", "remaining_time": "10:47:29", "throughput": 333.08, "total_tokens": 37705696} {"current_steps": 29785, "total_steps": 40000, "loss": 0.0307, "lr": 0.04574852651420786, "epoch": 1.4553294407934918, "percentage": 74.46, "elapsed_time": "1 day, 7:26:47", "remaining_time": "10:47:05", "throughput": 333.13, "total_tokens": 37712672} {"current_steps": 29790, "total_steps": 40000, "loss": 0.0532, "lr": 0.045706181943621985, "epoch": 1.4555737424571862, "percentage": 74.48, "elapsed_time": "1 day, 7:26:50", "remaining_time": "10:46:40", "throughput": 333.18, "total_tokens": 37719104} {"current_steps": 29795, "total_steps": 40000, "loss": 0.0383, "lr": 0.04566385345645344, "epoch": 1.4558180441208806, "percentage": 74.49, "elapsed_time": "1 day, 7:26:53", "remaining_time": "10:46:16", "throughput": 333.22, "total_tokens": 37725504} {"current_steps": 29800, "total_steps": 40000, "loss": 0.0565, "lr": 0.04562154105922993, "epoch": 1.4560623457845747, "percentage": 74.5, "elapsed_time": "1 day, 7:26:56", "remaining_time": "10:45:52", "throughput": 333.28, "total_tokens": 37732672} {"current_steps": 29800, "total_steps": 40000, "eval_loss": 0.06192663684487343, "epoch": 1.4560623457845747, "percentage": 74.5, "elapsed_time": "1 day, 7:37:37", "remaining_time": "10:49:31", "throughput": 331.4, "total_tokens": 37732672} {"current_steps": 29805, "total_steps": 40000, "loss": 0.0468, "lr": 0.04557924475847642, "epoch": 1.456306647448269, "percentage": 74.51, "elapsed_time": "1 day, 7:37:44", "remaining_time": "10:49:07", "throughput": 331.44, "total_tokens": 37738624} {"current_steps": 29810, "total_steps": 40000, "loss": 0.0649, "lr": 0.04553696456071567, "epoch": 1.4565509491119635, "percentage": 74.52, "elapsed_time": "1 day, 7:37:47", "remaining_time": "10:48:43", "throughput": 331.48, "total_tokens": 37745248} {"current_steps": 29815, "total_steps": 40000, "loss": 0.0691, "lr": 0.045494700472467724, "epoch": 1.4567952507756579, "percentage": 74.54, "elapsed_time": "1 day, 7:37:50", "remaining_time": "10:48:18", "throughput": 331.53, "total_tokens": 37751712} {"current_steps": 29820, "total_steps": 40000, "loss": 0.0478, "lr": 0.04545245250025024, "epoch": 1.457039552439352, "percentage": 74.55, "elapsed_time": "1 day, 7:37:53", "remaining_time": "10:47:54", "throughput": 331.58, "total_tokens": 37758080} {"current_steps": 29825, "total_steps": 40000, "loss": 0.0608, "lr": 0.045410220650578384, "epoch": 1.4572838541030464, "percentage": 74.56, "elapsed_time": "1 day, 7:37:56", "remaining_time": "10:47:29", "throughput": 331.62, "total_tokens": 37764288} {"current_steps": 29830, "total_steps": 40000, "loss": 0.0777, "lr": 0.04536800492996492, "epoch": 1.4575281557667408, "percentage": 74.58, "elapsed_time": "1 day, 7:37:59", "remaining_time": "10:47:05", "throughput": 331.67, "total_tokens": 37770784} {"current_steps": 29835, "total_steps": 40000, "loss": 0.0516, "lr": 0.04532580534491994, "epoch": 1.4577724574304352, "percentage": 74.59, "elapsed_time": "1 day, 7:38:02", "remaining_time": "10:46:40", "throughput": 331.72, "total_tokens": 37776800} {"current_steps": 29840, "total_steps": 40000, "loss": 0.0507, "lr": 0.045283621901951183, "epoch": 1.4580167590941295, "percentage": 74.6, "elapsed_time": "1 day, 7:38:05", "remaining_time": "10:46:16", "throughput": 331.76, "total_tokens": 37783008} {"current_steps": 29845, "total_steps": 40000, "loss": 0.0708, "lr": 0.04524145460756393, "epoch": 1.4582610607578237, "percentage": 74.61, "elapsed_time": "1 day, 7:38:08", "remaining_time": "10:45:51", "throughput": 331.81, "total_tokens": 37789280} {"current_steps": 29850, "total_steps": 40000, "loss": 0.0417, "lr": 0.045199303468260794, "epoch": 1.458505362421518, "percentage": 74.62, "elapsed_time": "1 day, 7:38:11", "remaining_time": "10:45:27", "throughput": 331.86, "total_tokens": 37795648} {"current_steps": 29855, "total_steps": 40000, "loss": 0.0499, "lr": 0.04515716849054214, "epoch": 1.4587496640852124, "percentage": 74.64, "elapsed_time": "1 day, 7:38:14", "remaining_time": "10:45:02", "throughput": 331.9, "total_tokens": 37801984} {"current_steps": 29860, "total_steps": 40000, "loss": 0.0762, "lr": 0.04511504968090558, "epoch": 1.4589939657489068, "percentage": 74.65, "elapsed_time": "1 day, 7:38:18", "remaining_time": "10:44:38", "throughput": 331.95, "total_tokens": 37808832} {"current_steps": 29865, "total_steps": 40000, "loss": 0.0464, "lr": 0.04507294704584644, "epoch": 1.459238267412601, "percentage": 74.66, "elapsed_time": "1 day, 7:38:21", "remaining_time": "10:44:13", "throughput": 332.0, "total_tokens": 37815072} {"current_steps": 29870, "total_steps": 40000, "loss": 0.04, "lr": 0.04503086059185749, "epoch": 1.4594825690762954, "percentage": 74.67, "elapsed_time": "1 day, 7:38:24", "remaining_time": "10:43:49", "throughput": 332.05, "total_tokens": 37821792} {"current_steps": 29875, "total_steps": 40000, "loss": 0.0528, "lr": 0.04498879032542893, "epoch": 1.4597268707399897, "percentage": 74.69, "elapsed_time": "1 day, 7:38:27", "remaining_time": "10:43:24", "throughput": 332.1, "total_tokens": 37828384} {"current_steps": 29880, "total_steps": 40000, "loss": 0.0646, "lr": 0.0449467362530486, "epoch": 1.4599711724036841, "percentage": 74.7, "elapsed_time": "1 day, 7:38:30", "remaining_time": "10:43:00", "throughput": 332.14, "total_tokens": 37834624} {"current_steps": 29885, "total_steps": 40000, "loss": 0.0426, "lr": 0.04490469838120171, "epoch": 1.4602154740673785, "percentage": 74.71, "elapsed_time": "1 day, 7:38:33", "remaining_time": "10:42:35", "throughput": 332.19, "total_tokens": 37841088} {"current_steps": 29890, "total_steps": 40000, "loss": 0.0446, "lr": 0.04486267671637101, "epoch": 1.4604597757310727, "percentage": 74.72, "elapsed_time": "1 day, 7:38:36", "remaining_time": "10:42:11", "throughput": 332.24, "total_tokens": 37847200} {"current_steps": 29895, "total_steps": 40000, "loss": 0.0379, "lr": 0.04482067126503683, "epoch": 1.460704077394767, "percentage": 74.74, "elapsed_time": "1 day, 7:38:39", "remaining_time": "10:41:46", "throughput": 332.28, "total_tokens": 37853792} {"current_steps": 29900, "total_steps": 40000, "loss": 0.0597, "lr": 0.04477868203367687, "epoch": 1.4609483790584614, "percentage": 74.75, "elapsed_time": "1 day, 7:38:42", "remaining_time": "10:41:22", "throughput": 332.33, "total_tokens": 37860160} {"current_steps": 29905, "total_steps": 40000, "loss": 0.0507, "lr": 0.044736709028766426, "epoch": 1.4611926807221558, "percentage": 74.76, "elapsed_time": "1 day, 7:38:46", "remaining_time": "10:40:57", "throughput": 332.38, "total_tokens": 37866784} {"current_steps": 29910, "total_steps": 40000, "loss": 0.0505, "lr": 0.04469475225677832, "epoch": 1.46143698238585, "percentage": 74.78, "elapsed_time": "1 day, 7:38:49", "remaining_time": "10:40:33", "throughput": 332.43, "total_tokens": 37873024} {"current_steps": 29915, "total_steps": 40000, "loss": 0.0472, "lr": 0.04465281172418273, "epoch": 1.4616812840495443, "percentage": 74.79, "elapsed_time": "1 day, 7:38:52", "remaining_time": "10:40:09", "throughput": 332.48, "total_tokens": 37879776} {"current_steps": 29920, "total_steps": 40000, "loss": 0.0349, "lr": 0.044610887437447476, "epoch": 1.4619255857132387, "percentage": 74.8, "elapsed_time": "1 day, 7:38:55", "remaining_time": "10:39:44", "throughput": 332.52, "total_tokens": 37886048} {"current_steps": 29925, "total_steps": 40000, "loss": 0.0483, "lr": 0.044568979403037744, "epoch": 1.462169887376933, "percentage": 74.81, "elapsed_time": "1 day, 7:38:58", "remaining_time": "10:39:20", "throughput": 332.57, "total_tokens": 37892416} {"current_steps": 29930, "total_steps": 40000, "loss": 0.0571, "lr": 0.04452708762741631, "epoch": 1.4624141890406275, "percentage": 74.83, "elapsed_time": "1 day, 7:39:01", "remaining_time": "10:38:55", "throughput": 332.62, "total_tokens": 37899072} {"current_steps": 29935, "total_steps": 40000, "loss": 0.0306, "lr": 0.044485212117043475, "epoch": 1.4626584907043216, "percentage": 74.84, "elapsed_time": "1 day, 7:39:04", "remaining_time": "10:38:31", "throughput": 332.66, "total_tokens": 37905120} {"current_steps": 29940, "total_steps": 40000, "loss": 0.0482, "lr": 0.04444335287837687, "epoch": 1.462902792368016, "percentage": 74.85, "elapsed_time": "1 day, 7:39:07", "remaining_time": "10:38:07", "throughput": 332.7, "total_tokens": 37910912} {"current_steps": 29945, "total_steps": 40000, "loss": 0.0661, "lr": 0.04440150991787179, "epoch": 1.4631470940317104, "percentage": 74.86, "elapsed_time": "1 day, 7:39:10", "remaining_time": "10:37:42", "throughput": 332.75, "total_tokens": 37917248} {"current_steps": 29950, "total_steps": 40000, "loss": 0.0633, "lr": 0.04435968324198088, "epoch": 1.4633913956954046, "percentage": 74.88, "elapsed_time": "1 day, 7:39:13", "remaining_time": "10:37:18", "throughput": 332.8, "total_tokens": 37923712} {"current_steps": 29955, "total_steps": 40000, "loss": 0.0645, "lr": 0.04431787285715442, "epoch": 1.463635697359099, "percentage": 74.89, "elapsed_time": "1 day, 7:39:17", "remaining_time": "10:36:53", "throughput": 332.85, "total_tokens": 37930144} {"current_steps": 29960, "total_steps": 40000, "loss": 0.0568, "lr": 0.04427607876984004, "epoch": 1.4638799990227933, "percentage": 74.9, "elapsed_time": "1 day, 7:39:20", "remaining_time": "10:36:29", "throughput": 332.89, "total_tokens": 37936480} {"current_steps": 29965, "total_steps": 40000, "loss": 0.0387, "lr": 0.044234300986482886, "epoch": 1.4641243006864877, "percentage": 74.91, "elapsed_time": "1 day, 7:39:23", "remaining_time": "10:36:05", "throughput": 332.94, "total_tokens": 37942784} {"current_steps": 29970, "total_steps": 40000, "loss": 0.0635, "lr": 0.04419253951352566, "epoch": 1.464368602350182, "percentage": 74.92, "elapsed_time": "1 day, 7:39:26", "remaining_time": "10:35:40", "throughput": 332.98, "total_tokens": 37948864} {"current_steps": 29975, "total_steps": 40000, "loss": 0.0698, "lr": 0.044150794357408533, "epoch": 1.4646129040138764, "percentage": 74.94, "elapsed_time": "1 day, 7:39:29", "remaining_time": "10:35:16", "throughput": 333.02, "total_tokens": 37954368} {"current_steps": 29980, "total_steps": 40000, "loss": 0.0559, "lr": 0.044109065524569065, "epoch": 1.4648572056775706, "percentage": 74.95, "elapsed_time": "1 day, 7:39:32", "remaining_time": "10:34:52", "throughput": 333.07, "total_tokens": 37960320} {"current_steps": 29985, "total_steps": 40000, "loss": 0.0493, "lr": 0.0440673530214424, "epoch": 1.465101507341265, "percentage": 74.96, "elapsed_time": "1 day, 7:39:35", "remaining_time": "10:34:27", "throughput": 333.11, "total_tokens": 37966144} {"current_steps": 29990, "total_steps": 40000, "loss": 0.0705, "lr": 0.04402565685446117, "epoch": 1.4653458090049594, "percentage": 74.98, "elapsed_time": "1 day, 7:39:38", "remaining_time": "10:34:03", "throughput": 333.15, "total_tokens": 37972256} {"current_steps": 29995, "total_steps": 40000, "loss": 0.0991, "lr": 0.04398397703005536, "epoch": 1.4655901106686535, "percentage": 74.99, "elapsed_time": "1 day, 7:39:41", "remaining_time": "10:33:39", "throughput": 333.2, "total_tokens": 37978496} {"current_steps": 30000, "total_steps": 40000, "loss": 0.0536, "lr": 0.043942313554652626, "epoch": 1.465834412332348, "percentage": 75.0, "elapsed_time": "1 day, 7:39:44", "remaining_time": "10:33:14", "throughput": 333.25, "total_tokens": 37984768} {"current_steps": 30000, "total_steps": 40000, "eval_loss": 0.06192677840590477, "epoch": 1.465834412332348, "percentage": 75.0, "elapsed_time": "1 day, 7:50:24", "remaining_time": "10:36:48", "throughput": 331.38, "total_tokens": 37984768} {"current_steps": 30005, "total_steps": 40000, "loss": 0.0525, "lr": 0.0439006664346779, "epoch": 1.4660787139960423, "percentage": 75.01, "elapsed_time": "1 day, 7:50:28", "remaining_time": "10:36:23", "throughput": 331.43, "total_tokens": 37990752} {"current_steps": 30010, "total_steps": 40000, "loss": 0.0608, "lr": 0.043859035676553755, "epoch": 1.4663230156597367, "percentage": 75.02, "elapsed_time": "1 day, 7:50:31", "remaining_time": "10:35:59", "throughput": 331.47, "total_tokens": 37996736} {"current_steps": 30015, "total_steps": 40000, "loss": 0.0966, "lr": 0.043817421286700194, "epoch": 1.466567317323431, "percentage": 75.04, "elapsed_time": "1 day, 7:50:34", "remaining_time": "10:35:35", "throughput": 331.51, "total_tokens": 38002880} {"current_steps": 30020, "total_steps": 40000, "loss": 0.0467, "lr": 0.043775823271534585, "epoch": 1.4668116189871254, "percentage": 75.05, "elapsed_time": "1 day, 7:50:37", "remaining_time": "10:35:10", "throughput": 331.56, "total_tokens": 38009408} {"current_steps": 30025, "total_steps": 40000, "loss": 0.056, "lr": 0.04373424163747197, "epoch": 1.4670559206508196, "percentage": 75.06, "elapsed_time": "1 day, 7:50:40", "remaining_time": "10:34:46", "throughput": 331.61, "total_tokens": 38015904} {"current_steps": 30030, "total_steps": 40000, "loss": 0.0667, "lr": 0.04369267639092473, "epoch": 1.467300222314514, "percentage": 75.08, "elapsed_time": "1 day, 7:50:43", "remaining_time": "10:34:21", "throughput": 331.66, "total_tokens": 38022176} {"current_steps": 30035, "total_steps": 40000, "loss": 0.0569, "lr": 0.04365112753830268, "epoch": 1.4675445239782083, "percentage": 75.09, "elapsed_time": "1 day, 7:50:46", "remaining_time": "10:33:57", "throughput": 331.7, "total_tokens": 38028864} {"current_steps": 30040, "total_steps": 40000, "loss": 0.0512, "lr": 0.04360959508601327, "epoch": 1.4677888256419025, "percentage": 75.1, "elapsed_time": "1 day, 7:50:49", "remaining_time": "10:33:33", "throughput": 331.75, "total_tokens": 38034976} {"current_steps": 30045, "total_steps": 40000, "loss": 0.0527, "lr": 0.04356807904046123, "epoch": 1.4680331273055969, "percentage": 75.11, "elapsed_time": "1 day, 7:50:52", "remaining_time": "10:33:08", "throughput": 331.79, "total_tokens": 38041184} {"current_steps": 30050, "total_steps": 40000, "loss": 0.0471, "lr": 0.04352657940804892, "epoch": 1.4682774289692913, "percentage": 75.12, "elapsed_time": "1 day, 7:50:55", "remaining_time": "10:32:44", "throughput": 331.84, "total_tokens": 38047232} {"current_steps": 30055, "total_steps": 40000, "loss": 0.0633, "lr": 0.04348509619517613, "epoch": 1.4685217306329856, "percentage": 75.14, "elapsed_time": "1 day, 7:50:58", "remaining_time": "10:32:19", "throughput": 331.89, "total_tokens": 38053632} {"current_steps": 30060, "total_steps": 40000, "loss": 0.0608, "lr": 0.04344362940824002, "epoch": 1.46876603229668, "percentage": 75.15, "elapsed_time": "1 day, 7:51:02", "remaining_time": "10:31:55", "throughput": 331.93, "total_tokens": 38060096} {"current_steps": 30065, "total_steps": 40000, "loss": 0.065, "lr": 0.04340217905363533, "epoch": 1.4690103339603744, "percentage": 75.16, "elapsed_time": "1 day, 7:51:05", "remaining_time": "10:31:31", "throughput": 331.98, "total_tokens": 38066304} {"current_steps": 30070, "total_steps": 40000, "loss": 0.0811, "lr": 0.04336074513775425, "epoch": 1.4692546356240686, "percentage": 75.17, "elapsed_time": "1 day, 7:51:08", "remaining_time": "10:31:06", "throughput": 332.02, "total_tokens": 38072256} {"current_steps": 30075, "total_steps": 40000, "loss": 0.0457, "lr": 0.04331932766698636, "epoch": 1.469498937287763, "percentage": 75.19, "elapsed_time": "1 day, 7:51:11", "remaining_time": "10:30:42", "throughput": 332.07, "total_tokens": 38078752} {"current_steps": 30080, "total_steps": 40000, "loss": 0.049, "lr": 0.0432779266477188, "epoch": 1.4697432389514573, "percentage": 75.2, "elapsed_time": "1 day, 7:51:14", "remaining_time": "10:30:18", "throughput": 332.11, "total_tokens": 38084928} {"current_steps": 30085, "total_steps": 40000, "loss": 0.0708, "lr": 0.04323654208633607, "epoch": 1.4699875406151515, "percentage": 75.21, "elapsed_time": "1 day, 7:51:17", "remaining_time": "10:29:53", "throughput": 332.16, "total_tokens": 38091712} {"current_steps": 30090, "total_steps": 40000, "loss": 0.0685, "lr": 0.04319517398922024, "epoch": 1.4702318422788458, "percentage": 75.22, "elapsed_time": "1 day, 7:51:20", "remaining_time": "10:29:29", "throughput": 332.21, "total_tokens": 38098272} {"current_steps": 30095, "total_steps": 40000, "loss": 0.0636, "lr": 0.04315382236275079, "epoch": 1.4704761439425402, "percentage": 75.24, "elapsed_time": "1 day, 7:51:23", "remaining_time": "10:29:05", "throughput": 332.26, "total_tokens": 38104256} {"current_steps": 30100, "total_steps": 40000, "loss": 0.0683, "lr": 0.043112487213304664, "epoch": 1.4707204456062346, "percentage": 75.25, "elapsed_time": "1 day, 7:51:26", "remaining_time": "10:28:40", "throughput": 332.3, "total_tokens": 38110688} {"current_steps": 30105, "total_steps": 40000, "loss": 0.0337, "lr": 0.04307116854725618, "epoch": 1.470964747269929, "percentage": 75.26, "elapsed_time": "1 day, 7:51:29", "remaining_time": "10:28:16", "throughput": 332.35, "total_tokens": 38116800} {"current_steps": 30110, "total_steps": 40000, "loss": 0.0689, "lr": 0.043029866370977325, "epoch": 1.4712090489336234, "percentage": 75.28, "elapsed_time": "1 day, 7:51:32", "remaining_time": "10:27:52", "throughput": 332.39, "total_tokens": 38122944} {"current_steps": 30115, "total_steps": 40000, "loss": 0.0543, "lr": 0.04298858069083728, "epoch": 1.4714533505973175, "percentage": 75.29, "elapsed_time": "1 day, 7:51:35", "remaining_time": "10:27:27", "throughput": 332.44, "total_tokens": 38129056} {"current_steps": 30120, "total_steps": 40000, "loss": 0.0352, "lr": 0.04294731151320295, "epoch": 1.471697652261012, "percentage": 75.3, "elapsed_time": "1 day, 7:51:39", "remaining_time": "10:27:03", "throughput": 332.48, "total_tokens": 38135680} {"current_steps": 30125, "total_steps": 40000, "loss": 0.0747, "lr": 0.04290605884443841, "epoch": 1.4719419539247063, "percentage": 75.31, "elapsed_time": "1 day, 7:51:42", "remaining_time": "10:26:39", "throughput": 332.53, "total_tokens": 38141408} {"current_steps": 30130, "total_steps": 40000, "loss": 0.0326, "lr": 0.04286482269090545, "epoch": 1.4721862555884004, "percentage": 75.33, "elapsed_time": "1 day, 7:51:45", "remaining_time": "10:26:15", "throughput": 332.57, "total_tokens": 38147808} {"current_steps": 30135, "total_steps": 40000, "loss": 0.0446, "lr": 0.04282360305896323, "epoch": 1.4724305572520948, "percentage": 75.34, "elapsed_time": "1 day, 7:51:48", "remaining_time": "10:25:50", "throughput": 332.62, "total_tokens": 38154176} {"current_steps": 30140, "total_steps": 40000, "loss": 0.063, "lr": 0.04278239995496822, "epoch": 1.4726748589157892, "percentage": 75.35, "elapsed_time": "1 day, 7:51:51", "remaining_time": "10:25:26", "throughput": 332.67, "total_tokens": 38160640} {"current_steps": 30145, "total_steps": 40000, "loss": 0.0599, "lr": 0.042741213385274514, "epoch": 1.4729191605794836, "percentage": 75.36, "elapsed_time": "1 day, 7:51:54", "remaining_time": "10:25:02", "throughput": 332.71, "total_tokens": 38166848} {"current_steps": 30150, "total_steps": 40000, "loss": 0.0884, "lr": 0.04270004335623366, "epoch": 1.473163462243178, "percentage": 75.38, "elapsed_time": "1 day, 7:51:57", "remaining_time": "10:24:38", "throughput": 332.75, "total_tokens": 38172704} {"current_steps": 30155, "total_steps": 40000, "loss": 0.0586, "lr": 0.04265888987419448, "epoch": 1.4734077639068723, "percentage": 75.39, "elapsed_time": "1 day, 7:52:00", "remaining_time": "10:24:13", "throughput": 332.81, "total_tokens": 38179616} {"current_steps": 30160, "total_steps": 40000, "loss": 0.0641, "lr": 0.04261775294550346, "epoch": 1.4736520655705665, "percentage": 75.4, "elapsed_time": "1 day, 7:52:03", "remaining_time": "10:23:49", "throughput": 332.85, "total_tokens": 38185824} {"current_steps": 30165, "total_steps": 40000, "loss": 0.0513, "lr": 0.042576632576504354, "epoch": 1.4738963672342609, "percentage": 75.41, "elapsed_time": "1 day, 7:52:06", "remaining_time": "10:23:25", "throughput": 332.9, "total_tokens": 38192288} {"current_steps": 30170, "total_steps": 40000, "loss": 0.0807, "lr": 0.0425355287735385, "epoch": 1.4741406688979553, "percentage": 75.42, "elapsed_time": "1 day, 7:52:10", "remaining_time": "10:23:01", "throughput": 332.95, "total_tokens": 38198816} {"current_steps": 30175, "total_steps": 40000, "loss": 0.0512, "lr": 0.0424944415429446, "epoch": 1.4743849705616494, "percentage": 75.44, "elapsed_time": "1 day, 7:52:13", "remaining_time": "10:22:37", "throughput": 333.0, "total_tokens": 38205632} {"current_steps": 30180, "total_steps": 40000, "loss": 0.0686, "lr": 0.04245337089105877, "epoch": 1.4746292722253438, "percentage": 75.45, "elapsed_time": "1 day, 7:52:16", "remaining_time": "10:22:13", "throughput": 333.04, "total_tokens": 38212064} {"current_steps": 30185, "total_steps": 40000, "loss": 0.0562, "lr": 0.04241231682421467, "epoch": 1.4748735738890382, "percentage": 75.46, "elapsed_time": "1 day, 7:52:19", "remaining_time": "10:21:48", "throughput": 333.09, "total_tokens": 38218272} {"current_steps": 30190, "total_steps": 40000, "loss": 0.0276, "lr": 0.04237127934874337, "epoch": 1.4751178755527325, "percentage": 75.48, "elapsed_time": "1 day, 7:52:22", "remaining_time": "10:21:24", "throughput": 333.13, "total_tokens": 38224576} {"current_steps": 30195, "total_steps": 40000, "loss": 0.0585, "lr": 0.042330258470973305, "epoch": 1.475362177216427, "percentage": 75.49, "elapsed_time": "1 day, 7:52:25", "remaining_time": "10:21:00", "throughput": 333.18, "total_tokens": 38231424} {"current_steps": 30200, "total_steps": 40000, "loss": 0.0665, "lr": 0.042289254197230515, "epoch": 1.4756064788801213, "percentage": 75.5, "elapsed_time": "1 day, 7:52:28", "remaining_time": "10:20:36", "throughput": 333.22, "total_tokens": 38237120} {"current_steps": 30200, "total_steps": 40000, "eval_loss": 0.06344887614250183, "epoch": 1.4756064788801213, "percentage": 75.5, "elapsed_time": "1 day, 8:03:08", "remaining_time": "10:24:04", "throughput": 331.38, "total_tokens": 38237120} {"current_steps": 30205, "total_steps": 40000, "loss": 0.0418, "lr": 0.04224826653383823, "epoch": 1.4758507805438155, "percentage": 75.51, "elapsed_time": "1 day, 8:03:12", "remaining_time": "10:23:40", "throughput": 331.42, "total_tokens": 38243392} {"current_steps": 30210, "total_steps": 40000, "loss": 0.0632, "lr": 0.04220729548711735, "epoch": 1.4760950822075098, "percentage": 75.52, "elapsed_time": "1 day, 8:03:15", "remaining_time": "10:23:15", "throughput": 331.46, "total_tokens": 38249568} {"current_steps": 30215, "total_steps": 40000, "loss": 0.0468, "lr": 0.04216634106338616, "epoch": 1.4763393838712042, "percentage": 75.54, "elapsed_time": "1 day, 8:03:18", "remaining_time": "10:22:51", "throughput": 331.51, "total_tokens": 38255936} {"current_steps": 30220, "total_steps": 40000, "loss": 0.0485, "lr": 0.04212540326896025, "epoch": 1.4765836855348984, "percentage": 75.55, "elapsed_time": "1 day, 8:03:21", "remaining_time": "10:22:27", "throughput": 331.56, "total_tokens": 38262176} {"current_steps": 30225, "total_steps": 40000, "loss": 0.0434, "lr": 0.0420844821101528, "epoch": 1.4768279871985928, "percentage": 75.56, "elapsed_time": "1 day, 8:03:24", "remaining_time": "10:22:02", "throughput": 331.6, "total_tokens": 38268416} {"current_steps": 30230, "total_steps": 40000, "loss": 0.0489, "lr": 0.04204357759327441, "epoch": 1.4770722888622871, "percentage": 75.58, "elapsed_time": "1 day, 8:03:28", "remaining_time": "10:21:38", "throughput": 331.65, "total_tokens": 38274848} {"current_steps": 30235, "total_steps": 40000, "loss": 0.0689, "lr": 0.042002689724632954, "epoch": 1.4773165905259815, "percentage": 75.59, "elapsed_time": "1 day, 8:03:31", "remaining_time": "10:21:14", "throughput": 331.69, "total_tokens": 38280928} {"current_steps": 30240, "total_steps": 40000, "loss": 0.0912, "lr": 0.04196181851053398, "epoch": 1.477560892189676, "percentage": 75.6, "elapsed_time": "1 day, 8:03:34", "remaining_time": "10:20:50", "throughput": 331.74, "total_tokens": 38287104} {"current_steps": 30245, "total_steps": 40000, "loss": 0.0506, "lr": 0.041920963957280295, "epoch": 1.47780519385337, "percentage": 75.61, "elapsed_time": "1 day, 8:03:37", "remaining_time": "10:20:25", "throughput": 331.78, "total_tokens": 38293376} {"current_steps": 30250, "total_steps": 40000, "loss": 0.0518, "lr": 0.04188012607117212, "epoch": 1.4780494955170644, "percentage": 75.62, "elapsed_time": "1 day, 8:03:40", "remaining_time": "10:20:01", "throughput": 331.83, "total_tokens": 38300096} {"current_steps": 30255, "total_steps": 40000, "loss": 0.0847, "lr": 0.04183930485850725, "epoch": 1.4782937971807588, "percentage": 75.64, "elapsed_time": "1 day, 8:03:43", "remaining_time": "10:19:37", "throughput": 331.88, "total_tokens": 38306464} {"current_steps": 30260, "total_steps": 40000, "loss": 0.044, "lr": 0.04179850032558078, "epoch": 1.4785380988444532, "percentage": 75.65, "elapsed_time": "1 day, 8:03:46", "remaining_time": "10:19:13", "throughput": 331.92, "total_tokens": 38312864} {"current_steps": 30265, "total_steps": 40000, "loss": 0.0644, "lr": 0.041757712478685295, "epoch": 1.4787824005081474, "percentage": 75.66, "elapsed_time": "1 day, 8:03:49", "remaining_time": "10:18:48", "throughput": 331.97, "total_tokens": 38319264} {"current_steps": 30270, "total_steps": 40000, "loss": 0.0282, "lr": 0.04171694132411085, "epoch": 1.4790267021718417, "percentage": 75.67, "elapsed_time": "1 day, 8:03:52", "remaining_time": "10:18:24", "throughput": 332.02, "total_tokens": 38325568} {"current_steps": 30275, "total_steps": 40000, "loss": 0.0822, "lr": 0.04167618686814479, "epoch": 1.4792710038355361, "percentage": 75.69, "elapsed_time": "1 day, 8:03:55", "remaining_time": "10:18:00", "throughput": 332.06, "total_tokens": 38331488} {"current_steps": 30280, "total_steps": 40000, "loss": 0.0357, "lr": 0.041635449117072024, "epoch": 1.4795153054992305, "percentage": 75.7, "elapsed_time": "1 day, 8:03:58", "remaining_time": "10:17:36", "throughput": 332.1, "total_tokens": 38337632} {"current_steps": 30285, "total_steps": 40000, "loss": 0.06, "lr": 0.04159472807717477, "epoch": 1.4797596071629249, "percentage": 75.71, "elapsed_time": "1 day, 8:04:01", "remaining_time": "10:17:12", "throughput": 332.15, "total_tokens": 38343840} {"current_steps": 30290, "total_steps": 40000, "loss": 0.0503, "lr": 0.041554023754732744, "epoch": 1.480003908826619, "percentage": 75.72, "elapsed_time": "1 day, 8:04:04", "remaining_time": "10:16:47", "throughput": 332.2, "total_tokens": 38350528} {"current_steps": 30295, "total_steps": 40000, "loss": 0.0631, "lr": 0.04151333615602311, "epoch": 1.4802482104903134, "percentage": 75.74, "elapsed_time": "1 day, 8:04:08", "remaining_time": "10:16:23", "throughput": 332.24, "total_tokens": 38356928} {"current_steps": 30300, "total_steps": 40000, "loss": 0.056, "lr": 0.04147266528732034, "epoch": 1.4804925121540078, "percentage": 75.75, "elapsed_time": "1 day, 8:04:11", "remaining_time": "10:15:59", "throughput": 332.29, "total_tokens": 38362880} {"current_steps": 30305, "total_steps": 40000, "loss": 0.0511, "lr": 0.0414320111548964, "epoch": 1.4807368138177022, "percentage": 75.76, "elapsed_time": "1 day, 8:04:14", "remaining_time": "10:15:35", "throughput": 332.33, "total_tokens": 38369120} {"current_steps": 30310, "total_steps": 40000, "loss": 0.0375, "lr": 0.04139137376502076, "epoch": 1.4809811154813963, "percentage": 75.78, "elapsed_time": "1 day, 8:04:17", "remaining_time": "10:15:11", "throughput": 332.38, "total_tokens": 38375328} {"current_steps": 30315, "total_steps": 40000, "loss": 0.0586, "lr": 0.04135075312396014, "epoch": 1.4812254171450907, "percentage": 75.79, "elapsed_time": "1 day, 8:04:20", "remaining_time": "10:14:47", "throughput": 332.43, "total_tokens": 38382368} {"current_steps": 30320, "total_steps": 40000, "loss": 0.0599, "lr": 0.04131014923797875, "epoch": 1.481469718808785, "percentage": 75.8, "elapsed_time": "1 day, 8:04:23", "remaining_time": "10:14:22", "throughput": 332.47, "total_tokens": 38388640} {"current_steps": 30325, "total_steps": 40000, "loss": 0.0631, "lr": 0.04126956211333819, "epoch": 1.4817140204724795, "percentage": 75.81, "elapsed_time": "1 day, 8:04:26", "remaining_time": "10:13:58", "throughput": 332.52, "total_tokens": 38395008} {"current_steps": 30330, "total_steps": 40000, "loss": 0.0859, "lr": 0.041228991756297545, "epoch": 1.4819583221361738, "percentage": 75.83, "elapsed_time": "1 day, 8:04:29", "remaining_time": "10:13:34", "throughput": 332.57, "total_tokens": 38401216} {"current_steps": 30335, "total_steps": 40000, "loss": 0.0496, "lr": 0.04118843817311332, "epoch": 1.482202623799868, "percentage": 75.84, "elapsed_time": "1 day, 8:04:32", "remaining_time": "10:13:10", "throughput": 332.61, "total_tokens": 38407744} {"current_steps": 30340, "total_steps": 40000, "loss": 0.051, "lr": 0.0411479013700393, "epoch": 1.4824469254635624, "percentage": 75.85, "elapsed_time": "1 day, 8:04:35", "remaining_time": "10:12:46", "throughput": 332.66, "total_tokens": 38414400} {"current_steps": 30345, "total_steps": 40000, "loss": 0.0562, "lr": 0.0411073813533268, "epoch": 1.4826912271272568, "percentage": 75.86, "elapsed_time": "1 day, 8:04:38", "remaining_time": "10:12:22", "throughput": 332.71, "total_tokens": 38420608} {"current_steps": 30350, "total_steps": 40000, "loss": 0.0544, "lr": 0.04106687812922456, "epoch": 1.4829355287909511, "percentage": 75.88, "elapsed_time": "1 day, 8:04:42", "remaining_time": "10:11:58", "throughput": 332.76, "total_tokens": 38427392} {"current_steps": 30355, "total_steps": 40000, "loss": 0.066, "lr": 0.041026391703978635, "epoch": 1.4831798304546453, "percentage": 75.89, "elapsed_time": "1 day, 8:04:45", "remaining_time": "10:11:34", "throughput": 332.8, "total_tokens": 38433952} {"current_steps": 30360, "total_steps": 40000, "loss": 0.0634, "lr": 0.04098592208383259, "epoch": 1.4834241321183397, "percentage": 75.9, "elapsed_time": "1 day, 8:04:48", "remaining_time": "10:11:10", "throughput": 332.85, "total_tokens": 38439936} {"current_steps": 30365, "total_steps": 40000, "loss": 0.0582, "lr": 0.040945469275027256, "epoch": 1.483668433782034, "percentage": 75.91, "elapsed_time": "1 day, 8:04:51", "remaining_time": "10:10:46", "throughput": 332.89, "total_tokens": 38445952} {"current_steps": 30370, "total_steps": 40000, "loss": 0.0804, "lr": 0.04090503328380104, "epoch": 1.4839127354457284, "percentage": 75.92, "elapsed_time": "1 day, 8:04:54", "remaining_time": "10:10:22", "throughput": 332.93, "total_tokens": 38452128} {"current_steps": 30375, "total_steps": 40000, "loss": 0.0458, "lr": 0.04086461411638971, "epoch": 1.4841570371094228, "percentage": 75.94, "elapsed_time": "1 day, 8:04:57", "remaining_time": "10:09:57", "throughput": 332.98, "total_tokens": 38458560} {"current_steps": 30380, "total_steps": 40000, "loss": 0.0703, "lr": 0.04082421177902631, "epoch": 1.484401338773117, "percentage": 75.95, "elapsed_time": "1 day, 8:05:00", "remaining_time": "10:09:33", "throughput": 333.03, "total_tokens": 38464960} {"current_steps": 30385, "total_steps": 40000, "loss": 0.0625, "lr": 0.04078382627794149, "epoch": 1.4846456404368114, "percentage": 75.96, "elapsed_time": "1 day, 8:05:03", "remaining_time": "10:09:09", "throughput": 333.07, "total_tokens": 38471200} {"current_steps": 30390, "total_steps": 40000, "loss": 0.0461, "lr": 0.04074345761936316, "epoch": 1.4848899421005057, "percentage": 75.98, "elapsed_time": "1 day, 8:05:06", "remaining_time": "10:08:45", "throughput": 333.12, "total_tokens": 38477344} {"current_steps": 30395, "total_steps": 40000, "loss": 0.0304, "lr": 0.04070310580951663, "epoch": 1.4851342437642001, "percentage": 75.99, "elapsed_time": "1 day, 8:05:09", "remaining_time": "10:08:21", "throughput": 333.16, "total_tokens": 38483712} {"current_steps": 30400, "total_steps": 40000, "loss": 0.0469, "lr": 0.040662770854624726, "epoch": 1.4853785454278943, "percentage": 76.0, "elapsed_time": "1 day, 8:05:13", "remaining_time": "10:07:57", "throughput": 333.21, "total_tokens": 38490112} {"current_steps": 30400, "total_steps": 40000, "eval_loss": 0.06272178143262863, "epoch": 1.4853785454278943, "percentage": 76.0, "elapsed_time": "1 day, 8:15:52", "remaining_time": "10:11:19", "throughput": 331.37, "total_tokens": 38490112} {"current_steps": 30405, "total_steps": 40000, "loss": 0.0538, "lr": 0.040622452760907535, "epoch": 1.4856228470915886, "percentage": 76.01, "elapsed_time": "1 day, 8:15:56", "remaining_time": "10:10:55", "throughput": 331.42, "total_tokens": 38496096} {"current_steps": 30410, "total_steps": 40000, "loss": 0.07, "lr": 0.04058215153458265, "epoch": 1.485867148755283, "percentage": 76.02, "elapsed_time": "1 day, 8:15:59", "remaining_time": "10:10:31", "throughput": 331.46, "total_tokens": 38502240} {"current_steps": 30415, "total_steps": 40000, "loss": 0.0572, "lr": 0.04054186718186507, "epoch": 1.4861114504189774, "percentage": 76.04, "elapsed_time": "1 day, 8:16:02", "remaining_time": "10:10:07", "throughput": 331.5, "total_tokens": 38508448} {"current_steps": 30420, "total_steps": 40000, "loss": 0.0426, "lr": 0.04050159970896708, "epoch": 1.4863557520826718, "percentage": 76.05, "elapsed_time": "1 day, 8:16:05", "remaining_time": "10:09:43", "throughput": 331.55, "total_tokens": 38514432} {"current_steps": 30425, "total_steps": 40000, "loss": 0.0651, "lr": 0.04046134912209843, "epoch": 1.486600053746366, "percentage": 76.06, "elapsed_time": "1 day, 8:16:08", "remaining_time": "10:09:19", "throughput": 331.59, "total_tokens": 38520736} {"current_steps": 30430, "total_steps": 40000, "loss": 0.089, "lr": 0.040421115427466354, "epoch": 1.4868443554100603, "percentage": 76.08, "elapsed_time": "1 day, 8:16:11", "remaining_time": "10:08:55", "throughput": 331.63, "total_tokens": 38526624} {"current_steps": 30435, "total_steps": 40000, "loss": 0.0497, "lr": 0.04038089863127529, "epoch": 1.4870886570737547, "percentage": 76.09, "elapsed_time": "1 day, 8:16:15", "remaining_time": "10:08:31", "throughput": 331.68, "total_tokens": 38533376} {"current_steps": 30440, "total_steps": 40000, "loss": 0.0656, "lr": 0.04034069873972727, "epoch": 1.487332958737449, "percentage": 76.1, "elapsed_time": "1 day, 8:16:18", "remaining_time": "10:08:06", "throughput": 331.73, "total_tokens": 38540192} {"current_steps": 30445, "total_steps": 40000, "loss": 0.063, "lr": 0.040300515759021514, "epoch": 1.4875772604011432, "percentage": 76.11, "elapsed_time": "1 day, 8:16:21", "remaining_time": "10:07:42", "throughput": 331.78, "total_tokens": 38546432} {"current_steps": 30450, "total_steps": 40000, "loss": 0.0451, "lr": 0.04026034969535478, "epoch": 1.4878215620648376, "percentage": 76.12, "elapsed_time": "1 day, 8:16:24", "remaining_time": "10:07:18", "throughput": 331.83, "total_tokens": 38552928} {"current_steps": 30455, "total_steps": 40000, "loss": 0.0412, "lr": 0.040220200554921266, "epoch": 1.488065863728532, "percentage": 76.14, "elapsed_time": "1 day, 8:16:27", "remaining_time": "10:06:54", "throughput": 331.87, "total_tokens": 38559584} {"current_steps": 30460, "total_steps": 40000, "loss": 0.0773, "lr": 0.0401800683439124, "epoch": 1.4883101653922264, "percentage": 76.15, "elapsed_time": "1 day, 8:16:30", "remaining_time": "10:06:30", "throughput": 331.92, "total_tokens": 38565696} {"current_steps": 30465, "total_steps": 40000, "loss": 0.0483, "lr": 0.04013995306851704, "epoch": 1.4885544670559208, "percentage": 76.16, "elapsed_time": "1 day, 8:16:33", "remaining_time": "10:06:06", "throughput": 331.97, "total_tokens": 38572416} {"current_steps": 30470, "total_steps": 40000, "loss": 0.0385, "lr": 0.040099854734921545, "epoch": 1.488798768719615, "percentage": 76.17, "elapsed_time": "1 day, 8:16:37", "remaining_time": "10:05:42", "throughput": 332.01, "total_tokens": 38579040} {"current_steps": 30475, "total_steps": 40000, "loss": 0.0696, "lr": 0.0400597733493095, "epoch": 1.4890430703833093, "percentage": 76.19, "elapsed_time": "1 day, 8:16:39", "remaining_time": "10:05:18", "throughput": 332.06, "total_tokens": 38584864} {"current_steps": 30480, "total_steps": 40000, "loss": 0.0542, "lr": 0.04001970891786203, "epoch": 1.4892873720470037, "percentage": 76.2, "elapsed_time": "1 day, 8:16:43", "remaining_time": "10:04:54", "throughput": 332.1, "total_tokens": 38591616} {"current_steps": 30485, "total_steps": 40000, "loss": 0.0593, "lr": 0.03997966144675752, "epoch": 1.4895316737106978, "percentage": 76.21, "elapsed_time": "1 day, 8:16:46", "remaining_time": "10:04:30", "throughput": 332.15, "total_tokens": 38598048} {"current_steps": 30490, "total_steps": 40000, "loss": 0.0608, "lr": 0.039939630942171796, "epoch": 1.4897759753743922, "percentage": 76.22, "elapsed_time": "1 day, 8:16:49", "remaining_time": "10:04:06", "throughput": 332.2, "total_tokens": 38604544} {"current_steps": 30495, "total_steps": 40000, "loss": 0.036, "lr": 0.03989961741027815, "epoch": 1.4900202770380866, "percentage": 76.24, "elapsed_time": "1 day, 8:16:52", "remaining_time": "10:03:42", "throughput": 332.25, "total_tokens": 38611072} {"current_steps": 30500, "total_steps": 40000, "loss": 0.0811, "lr": 0.03985962085724704, "epoch": 1.490264578701781, "percentage": 76.25, "elapsed_time": "1 day, 8:16:55", "remaining_time": "10:03:18", "throughput": 332.29, "total_tokens": 38617408} {"current_steps": 30505, "total_steps": 40000, "loss": 0.0651, "lr": 0.03981964128924656, "epoch": 1.4905088803654754, "percentage": 76.26, "elapsed_time": "1 day, 8:16:58", "remaining_time": "10:02:54", "throughput": 332.33, "total_tokens": 38623328} {"current_steps": 30510, "total_steps": 40000, "loss": 0.0386, "lr": 0.03977967871244197, "epoch": 1.4907531820291697, "percentage": 76.28, "elapsed_time": "1 day, 8:17:01", "remaining_time": "10:02:30", "throughput": 332.38, "total_tokens": 38629632} {"current_steps": 30515, "total_steps": 40000, "loss": 0.0859, "lr": 0.03973973313299602, "epoch": 1.490997483692864, "percentage": 76.29, "elapsed_time": "1 day, 8:17:04", "remaining_time": "10:02:06", "throughput": 332.42, "total_tokens": 38635776} {"current_steps": 30520, "total_steps": 40000, "loss": 0.0875, "lr": 0.0396998045570689, "epoch": 1.4912417853565583, "percentage": 76.3, "elapsed_time": "1 day, 8:17:07", "remaining_time": "10:01:42", "throughput": 332.47, "total_tokens": 38641888} {"current_steps": 30525, "total_steps": 40000, "loss": 0.083, "lr": 0.03965989299081798, "epoch": 1.4914860870202526, "percentage": 76.31, "elapsed_time": "1 day, 8:17:10", "remaining_time": "10:01:18", "throughput": 332.51, "total_tokens": 38648320} {"current_steps": 30530, "total_steps": 40000, "loss": 0.0489, "lr": 0.039619998440398235, "epoch": 1.4917303886839468, "percentage": 76.33, "elapsed_time": "1 day, 8:17:13", "remaining_time": "10:00:54", "throughput": 332.56, "total_tokens": 38654432} {"current_steps": 30535, "total_steps": 40000, "loss": 0.0374, "lr": 0.03958012091196184, "epoch": 1.4919746903476412, "percentage": 76.34, "elapsed_time": "1 day, 8:17:17", "remaining_time": "10:00:30", "throughput": 332.6, "total_tokens": 38661024} {"current_steps": 30540, "total_steps": 40000, "loss": 0.0379, "lr": 0.039540260411658396, "epoch": 1.4922189920113356, "percentage": 76.35, "elapsed_time": "1 day, 8:17:20", "remaining_time": "10:00:06", "throughput": 332.65, "total_tokens": 38667136} {"current_steps": 30545, "total_steps": 40000, "loss": 0.0543, "lr": 0.03950041694563496, "epoch": 1.49246329367503, "percentage": 76.36, "elapsed_time": "1 day, 8:17:23", "remaining_time": "9:59:42", "throughput": 332.7, "total_tokens": 38673600} {"current_steps": 30550, "total_steps": 40000, "loss": 0.0401, "lr": 0.0394605905200358, "epoch": 1.4927075953387243, "percentage": 76.38, "elapsed_time": "1 day, 8:17:26", "remaining_time": "9:59:18", "throughput": 332.74, "total_tokens": 38679616} {"current_steps": 30555, "total_steps": 40000, "loss": 0.0589, "lr": 0.03942078114100272, "epoch": 1.4929518970024187, "percentage": 76.39, "elapsed_time": "1 day, 8:17:29", "remaining_time": "9:58:54", "throughput": 332.78, "total_tokens": 38685824} {"current_steps": 30560, "total_steps": 40000, "loss": 0.0669, "lr": 0.03938098881467485, "epoch": 1.4931961986661129, "percentage": 76.4, "elapsed_time": "1 day, 8:17:32", "remaining_time": "9:58:30", "throughput": 332.83, "total_tokens": 38692224} {"current_steps": 30565, "total_steps": 40000, "loss": 0.0402, "lr": 0.039341213547188586, "epoch": 1.4934405003298072, "percentage": 76.41, "elapsed_time": "1 day, 8:17:35", "remaining_time": "9:58:06", "throughput": 332.88, "total_tokens": 38699232} {"current_steps": 30570, "total_steps": 40000, "loss": 0.0427, "lr": 0.03930145534467782, "epoch": 1.4936848019935016, "percentage": 76.42, "elapsed_time": "1 day, 8:17:38", "remaining_time": "9:57:42", "throughput": 332.93, "total_tokens": 38705696} {"current_steps": 30575, "total_steps": 40000, "loss": 0.0603, "lr": 0.0392617142132738, "epoch": 1.4939291036571958, "percentage": 76.44, "elapsed_time": "1 day, 8:17:41", "remaining_time": "9:57:18", "throughput": 332.97, "total_tokens": 38711616} {"current_steps": 30580, "total_steps": 40000, "loss": 0.0523, "lr": 0.03922199015910504, "epoch": 1.4941734053208902, "percentage": 76.45, "elapsed_time": "1 day, 8:17:44", "remaining_time": "9:56:54", "throughput": 333.01, "total_tokens": 38717504} {"current_steps": 30585, "total_steps": 40000, "loss": 0.0583, "lr": 0.039182283188297556, "epoch": 1.4944177069845845, "percentage": 76.46, "elapsed_time": "1 day, 8:17:47", "remaining_time": "9:56:30", "throughput": 333.06, "total_tokens": 38724000} {"current_steps": 30590, "total_steps": 40000, "loss": 0.071, "lr": 0.039142593306974595, "epoch": 1.494662008648279, "percentage": 76.48, "elapsed_time": "1 day, 8:17:50", "remaining_time": "9:56:06", "throughput": 333.1, "total_tokens": 38730336} {"current_steps": 30595, "total_steps": 40000, "loss": 0.0385, "lr": 0.039102920521256856, "epoch": 1.4949063103119733, "percentage": 76.49, "elapsed_time": "1 day, 8:17:53", "remaining_time": "9:55:42", "throughput": 333.15, "total_tokens": 38736352} {"current_steps": 30600, "total_steps": 40000, "loss": 0.0572, "lr": 0.03906326483726243, "epoch": 1.4951506119756677, "percentage": 76.5, "elapsed_time": "1 day, 8:17:57", "remaining_time": "9:55:19", "throughput": 333.19, "total_tokens": 38742560} {"current_steps": 30600, "total_steps": 40000, "eval_loss": 0.06201574578881264, "epoch": 1.4951506119756677, "percentage": 76.5, "elapsed_time": "1 day, 8:28:36", "remaining_time": "9:58:35", "throughput": 331.37, "total_tokens": 38742560} {"current_steps": 30605, "total_steps": 40000, "loss": 0.0463, "lr": 0.039023626261106704, "epoch": 1.4953949136393618, "percentage": 76.51, "elapsed_time": "1 day, 8:28:40", "remaining_time": "9:58:11", "throughput": 331.42, "total_tokens": 38749408} {"current_steps": 30610, "total_steps": 40000, "loss": 0.0579, "lr": 0.03898400479890237, "epoch": 1.4956392153030562, "percentage": 76.53, "elapsed_time": "1 day, 8:28:43", "remaining_time": "9:57:47", "throughput": 331.46, "total_tokens": 38755840} {"current_steps": 30615, "total_steps": 40000, "loss": 0.064, "lr": 0.038944400456759655, "epoch": 1.4958835169667506, "percentage": 76.54, "elapsed_time": "1 day, 8:28:47", "remaining_time": "9:57:23", "throughput": 331.51, "total_tokens": 38762272} {"current_steps": 30620, "total_steps": 40000, "loss": 0.0511, "lr": 0.038904813240785964, "epoch": 1.4961278186304448, "percentage": 76.55, "elapsed_time": "1 day, 8:28:50", "remaining_time": "9:56:59", "throughput": 331.55, "total_tokens": 38768576} {"current_steps": 30625, "total_steps": 40000, "loss": 0.037, "lr": 0.03886524315708621, "epoch": 1.4963721202941391, "percentage": 76.56, "elapsed_time": "1 day, 8:28:53", "remaining_time": "9:56:35", "throughput": 331.6, "total_tokens": 38775040} {"current_steps": 30630, "total_steps": 40000, "loss": 0.0725, "lr": 0.03882569021176255, "epoch": 1.4966164219578335, "percentage": 76.58, "elapsed_time": "1 day, 8:28:56", "remaining_time": "9:56:11", "throughput": 331.65, "total_tokens": 38781536} {"current_steps": 30635, "total_steps": 40000, "loss": 0.056, "lr": 0.038786154410914535, "epoch": 1.4968607236215279, "percentage": 76.59, "elapsed_time": "1 day, 8:28:59", "remaining_time": "9:55:47", "throughput": 331.69, "total_tokens": 38787744} {"current_steps": 30640, "total_steps": 40000, "loss": 0.0387, "lr": 0.03874663576063917, "epoch": 1.4971050252852223, "percentage": 76.6, "elapsed_time": "1 day, 8:29:02", "remaining_time": "9:55:23", "throughput": 331.74, "total_tokens": 38794112} {"current_steps": 30645, "total_steps": 40000, "loss": 0.0408, "lr": 0.038707134267030624, "epoch": 1.4973493269489166, "percentage": 76.61, "elapsed_time": "1 day, 8:29:05", "remaining_time": "9:55:00", "throughput": 331.79, "total_tokens": 38800864} {"current_steps": 30650, "total_steps": 40000, "loss": 0.0436, "lr": 0.038667649936180555, "epoch": 1.4975936286126108, "percentage": 76.62, "elapsed_time": "1 day, 8:29:08", "remaining_time": "9:54:36", "throughput": 331.83, "total_tokens": 38807328} {"current_steps": 30655, "total_steps": 40000, "loss": 0.0664, "lr": 0.038628182774178, "epoch": 1.4978379302763052, "percentage": 76.64, "elapsed_time": "1 day, 8:29:11", "remaining_time": "9:54:12", "throughput": 331.87, "total_tokens": 38813344} {"current_steps": 30660, "total_steps": 40000, "loss": 0.0435, "lr": 0.038588732787109226, "epoch": 1.4980822319399996, "percentage": 76.65, "elapsed_time": "1 day, 8:29:14", "remaining_time": "9:53:48", "throughput": 331.92, "total_tokens": 38819488} {"current_steps": 30665, "total_steps": 40000, "loss": 0.04, "lr": 0.03854929998105795, "epoch": 1.4983265336036937, "percentage": 76.66, "elapsed_time": "1 day, 8:29:17", "remaining_time": "9:53:24", "throughput": 331.96, "total_tokens": 38825760} {"current_steps": 30670, "total_steps": 40000, "loss": 0.0403, "lr": 0.03850988436210518, "epoch": 1.498570835267388, "percentage": 76.68, "elapsed_time": "1 day, 8:29:21", "remaining_time": "9:53:00", "throughput": 332.01, "total_tokens": 38832128} {"current_steps": 30675, "total_steps": 40000, "loss": 0.0689, "lr": 0.03847048593632933, "epoch": 1.4988151369310825, "percentage": 76.69, "elapsed_time": "1 day, 8:29:24", "remaining_time": "9:52:36", "throughput": 332.05, "total_tokens": 38838112} {"current_steps": 30680, "total_steps": 40000, "loss": 0.0649, "lr": 0.038431104709806096, "epoch": 1.4990594385947769, "percentage": 76.7, "elapsed_time": "1 day, 8:29:27", "remaining_time": "9:52:12", "throughput": 332.1, "total_tokens": 38844512} {"current_steps": 30685, "total_steps": 40000, "loss": 0.0461, "lr": 0.0383917406886086, "epoch": 1.4993037402584712, "percentage": 76.71, "elapsed_time": "1 day, 8:29:30", "remaining_time": "9:51:48", "throughput": 332.14, "total_tokens": 38850368} {"current_steps": 30690, "total_steps": 40000, "loss": 0.0723, "lr": 0.03835239387880722, "epoch": 1.4995480419221656, "percentage": 76.72, "elapsed_time": "1 day, 8:29:33", "remaining_time": "9:51:24", "throughput": 332.18, "total_tokens": 38856480} {"current_steps": 30695, "total_steps": 40000, "loss": 0.0952, "lr": 0.03831306428646979, "epoch": 1.4997923435858598, "percentage": 76.74, "elapsed_time": "1 day, 8:29:36", "remaining_time": "9:51:00", "throughput": 332.23, "total_tokens": 38862912} {"current_steps": 30700, "total_steps": 40000, "loss": 0.0584, "lr": 0.03827375191766135, "epoch": 1.5000366452495542, "percentage": 76.75, "elapsed_time": "1 day, 8:29:39", "remaining_time": "9:50:36", "throughput": 332.27, "total_tokens": 38869344} {"current_steps": 30705, "total_steps": 40000, "loss": 0.0872, "lr": 0.03823445677844446, "epoch": 1.5002809469132483, "percentage": 76.76, "elapsed_time": "1 day, 8:29:42", "remaining_time": "9:50:12", "throughput": 332.32, "total_tokens": 38875392} {"current_steps": 30710, "total_steps": 40000, "loss": 0.0864, "lr": 0.03819517887487881, "epoch": 1.5005252485769427, "percentage": 76.78, "elapsed_time": "1 day, 8:29:45", "remaining_time": "9:49:48", "throughput": 332.36, "total_tokens": 38881696} {"current_steps": 30715, "total_steps": 40000, "loss": 0.0584, "lr": 0.03815591821302161, "epoch": 1.500769550240637, "percentage": 76.79, "elapsed_time": "1 day, 8:29:48", "remaining_time": "9:49:25", "throughput": 332.41, "total_tokens": 38887680} {"current_steps": 30720, "total_steps": 40000, "loss": 0.0747, "lr": 0.03811667479892739, "epoch": 1.5010138519043315, "percentage": 76.8, "elapsed_time": "1 day, 8:29:51", "remaining_time": "9:49:01", "throughput": 332.45, "total_tokens": 38894016} {"current_steps": 30725, "total_steps": 40000, "loss": 0.0602, "lr": 0.03807744863864788, "epoch": 1.5012581535680258, "percentage": 76.81, "elapsed_time": "1 day, 8:29:54", "remaining_time": "9:48:37", "throughput": 332.5, "total_tokens": 38901056} {"current_steps": 30730, "total_steps": 40000, "loss": 0.0841, "lr": 0.03803823973823229, "epoch": 1.5015024552317202, "percentage": 76.83, "elapsed_time": "1 day, 8:29:58", "remaining_time": "9:48:13", "throughput": 332.55, "total_tokens": 38907328} {"current_steps": 30735, "total_steps": 40000, "loss": 0.0672, "lr": 0.03799904810372719, "epoch": 1.5017467568954146, "percentage": 76.84, "elapsed_time": "1 day, 8:30:01", "remaining_time": "9:47:49", "throughput": 332.59, "total_tokens": 38913856} {"current_steps": 30740, "total_steps": 40000, "loss": 0.0335, "lr": 0.03795987374117632, "epoch": 1.5019910585591087, "percentage": 76.85, "elapsed_time": "1 day, 8:30:04", "remaining_time": "9:47:25", "throughput": 332.64, "total_tokens": 38919840} {"current_steps": 30745, "total_steps": 40000, "loss": 0.0442, "lr": 0.03792071665662093, "epoch": 1.5022353602228031, "percentage": 76.86, "elapsed_time": "1 day, 8:30:07", "remaining_time": "9:47:02", "throughput": 332.68, "total_tokens": 38926048} {"current_steps": 30750, "total_steps": 40000, "loss": 0.0379, "lr": 0.03788157685609952, "epoch": 1.5024796618864973, "percentage": 76.88, "elapsed_time": "1 day, 8:30:10", "remaining_time": "9:46:38", "throughput": 332.72, "total_tokens": 38931840} {"current_steps": 30755, "total_steps": 40000, "loss": 0.0757, "lr": 0.037842454345647876, "epoch": 1.5027239635501917, "percentage": 76.89, "elapsed_time": "1 day, 8:30:13", "remaining_time": "9:46:14", "throughput": 332.77, "total_tokens": 38938048} {"current_steps": 30760, "total_steps": 40000, "loss": 0.046, "lr": 0.03780334913129929, "epoch": 1.502968265213886, "percentage": 76.9, "elapsed_time": "1 day, 8:30:16", "remaining_time": "9:45:50", "throughput": 332.81, "total_tokens": 38943936} {"current_steps": 30765, "total_steps": 40000, "loss": 0.068, "lr": 0.037764261219084175, "epoch": 1.5032125668775804, "percentage": 76.91, "elapsed_time": "1 day, 8:30:19", "remaining_time": "9:45:26", "throughput": 332.85, "total_tokens": 38949984} {"current_steps": 30770, "total_steps": 40000, "loss": 0.0444, "lr": 0.037725190615030414, "epoch": 1.5034568685412748, "percentage": 76.92, "elapsed_time": "1 day, 8:30:22", "remaining_time": "9:45:02", "throughput": 332.9, "total_tokens": 38956512} {"current_steps": 30775, "total_steps": 40000, "loss": 0.0331, "lr": 0.037686137325163224, "epoch": 1.5037011702049692, "percentage": 76.94, "elapsed_time": "1 day, 8:30:25", "remaining_time": "9:44:39", "throughput": 332.95, "total_tokens": 38963200} {"current_steps": 30780, "total_steps": 40000, "loss": 0.044, "lr": 0.037647101355505065, "epoch": 1.5039454718686636, "percentage": 76.95, "elapsed_time": "1 day, 8:30:28", "remaining_time": "9:44:15", "throughput": 332.99, "total_tokens": 38969408} {"current_steps": 30785, "total_steps": 40000, "loss": 0.0343, "lr": 0.03760808271207581, "epoch": 1.5041897735323577, "percentage": 76.96, "elapsed_time": "1 day, 8:30:31", "remaining_time": "9:43:51", "throughput": 333.03, "total_tokens": 38975296} {"current_steps": 30790, "total_steps": 40000, "loss": 0.0433, "lr": 0.03756908140089258, "epoch": 1.504434075196052, "percentage": 76.98, "elapsed_time": "1 day, 8:30:34", "remaining_time": "9:43:27", "throughput": 333.08, "total_tokens": 38981952} {"current_steps": 30795, "total_steps": 40000, "loss": 0.0523, "lr": 0.03753009742796989, "epoch": 1.5046783768597463, "percentage": 76.99, "elapsed_time": "1 day, 8:30:37", "remaining_time": "9:43:04", "throughput": 333.12, "total_tokens": 38987904} {"current_steps": 30800, "total_steps": 40000, "loss": 0.0473, "lr": 0.037491130799319615, "epoch": 1.5049226785234406, "percentage": 77.0, "elapsed_time": "1 day, 8:30:40", "remaining_time": "9:42:40", "throughput": 333.17, "total_tokens": 38994368} {"current_steps": 30800, "total_steps": 40000, "eval_loss": 0.06161757558584213, "epoch": 1.5049226785234406, "percentage": 77.0, "elapsed_time": "1 day, 8:41:19", "remaining_time": "9:45:51", "throughput": 331.36, "total_tokens": 38994368} {"current_steps": 30805, "total_steps": 40000, "loss": 0.0393, "lr": 0.03745218152095079, "epoch": 1.505166980187135, "percentage": 77.01, "elapsed_time": "1 day, 8:41:25", "remaining_time": "9:45:27", "throughput": 331.4, "total_tokens": 39000832} {"current_steps": 30810, "total_steps": 40000, "loss": 0.0627, "lr": 0.037413249598869935, "epoch": 1.5054112818508294, "percentage": 77.03, "elapsed_time": "1 day, 8:41:28", "remaining_time": "9:45:04", "throughput": 331.45, "total_tokens": 39007360} {"current_steps": 30815, "total_steps": 40000, "loss": 0.0588, "lr": 0.037374335039080886, "epoch": 1.5056555835145238, "percentage": 77.04, "elapsed_time": "1 day, 8:41:31", "remaining_time": "9:44:40", "throughput": 331.49, "total_tokens": 39013984} {"current_steps": 30820, "total_steps": 40000, "loss": 0.0464, "lr": 0.037335437847584724, "epoch": 1.5058998851782182, "percentage": 77.05, "elapsed_time": "1 day, 8:41:34", "remaining_time": "9:44:16", "throughput": 331.54, "total_tokens": 39020672} {"current_steps": 30825, "total_steps": 40000, "loss": 0.0941, "lr": 0.03729655803037983, "epoch": 1.5061441868419125, "percentage": 77.06, "elapsed_time": "1 day, 8:41:37", "remaining_time": "9:43:52", "throughput": 331.59, "total_tokens": 39027040} {"current_steps": 30830, "total_steps": 40000, "loss": 0.0481, "lr": 0.03725769559346207, "epoch": 1.5063884885056067, "percentage": 77.08, "elapsed_time": "1 day, 8:41:40", "remaining_time": "9:43:28", "throughput": 331.63, "total_tokens": 39033504} {"current_steps": 30835, "total_steps": 40000, "loss": 0.0383, "lr": 0.03721885054282439, "epoch": 1.506632790169301, "percentage": 77.09, "elapsed_time": "1 day, 8:41:44", "remaining_time": "9:43:04", "throughput": 331.68, "total_tokens": 39040128} {"current_steps": 30840, "total_steps": 40000, "loss": 0.045, "lr": 0.03718002288445731, "epoch": 1.5068770918329952, "percentage": 77.1, "elapsed_time": "1 day, 8:41:47", "remaining_time": "9:42:41", "throughput": 331.73, "total_tokens": 39046560} {"current_steps": 30845, "total_steps": 40000, "loss": 0.0527, "lr": 0.03714121262434844, "epoch": 1.5071213934966896, "percentage": 77.11, "elapsed_time": "1 day, 8:41:50", "remaining_time": "9:42:17", "throughput": 331.77, "total_tokens": 39052576} {"current_steps": 30850, "total_steps": 40000, "loss": 0.0414, "lr": 0.037102419768482844, "epoch": 1.507365695160384, "percentage": 77.12, "elapsed_time": "1 day, 8:41:53", "remaining_time": "9:41:53", "throughput": 331.81, "total_tokens": 39058880} {"current_steps": 30855, "total_steps": 40000, "loss": 0.05, "lr": 0.03706364432284293, "epoch": 1.5076099968240784, "percentage": 77.14, "elapsed_time": "1 day, 8:41:56", "remaining_time": "9:41:29", "throughput": 331.86, "total_tokens": 39065152} {"current_steps": 30860, "total_steps": 40000, "loss": 0.0793, "lr": 0.03702488629340828, "epoch": 1.5078542984877727, "percentage": 77.15, "elapsed_time": "1 day, 8:41:59", "remaining_time": "9:41:05", "throughput": 331.9, "total_tokens": 39071424} {"current_steps": 30865, "total_steps": 40000, "loss": 0.069, "lr": 0.036986145686155915, "epoch": 1.5080986001514671, "percentage": 77.16, "elapsed_time": "1 day, 8:42:02", "remaining_time": "9:40:41", "throughput": 331.94, "total_tokens": 39077248} {"current_steps": 30870, "total_steps": 40000, "loss": 0.0329, "lr": 0.036947422507060075, "epoch": 1.5083429018151615, "percentage": 77.18, "elapsed_time": "1 day, 8:42:05", "remaining_time": "9:40:18", "throughput": 331.99, "total_tokens": 39083360} {"current_steps": 30875, "total_steps": 40000, "loss": 0.0634, "lr": 0.0369087167620924, "epoch": 1.5085872034788557, "percentage": 77.19, "elapsed_time": "1 day, 8:42:08", "remaining_time": "9:39:54", "throughput": 332.03, "total_tokens": 39089760} {"current_steps": 30880, "total_steps": 40000, "loss": 0.0418, "lr": 0.03687002845722183, "epoch": 1.50883150514255, "percentage": 77.2, "elapsed_time": "1 day, 8:42:11", "remaining_time": "9:39:30", "throughput": 332.08, "total_tokens": 39096448} {"current_steps": 30885, "total_steps": 40000, "loss": 0.061, "lr": 0.03683135759841451, "epoch": 1.5090758068062442, "percentage": 77.21, "elapsed_time": "1 day, 8:42:14", "remaining_time": "9:39:06", "throughput": 332.13, "total_tokens": 39102816} {"current_steps": 30890, "total_steps": 40000, "loss": 0.0507, "lr": 0.03679270419163406, "epoch": 1.5093201084699386, "percentage": 77.22, "elapsed_time": "1 day, 8:42:18", "remaining_time": "9:38:43", "throughput": 332.17, "total_tokens": 39109120} {"current_steps": 30895, "total_steps": 40000, "loss": 0.0464, "lr": 0.03675406824284127, "epoch": 1.509564410133633, "percentage": 77.24, "elapsed_time": "1 day, 8:42:21", "remaining_time": "9:38:19", "throughput": 332.21, "total_tokens": 39114912} {"current_steps": 30900, "total_steps": 40000, "loss": 0.0678, "lr": 0.03671544975799425, "epoch": 1.5098087117973273, "percentage": 77.25, "elapsed_time": "1 day, 8:42:23", "remaining_time": "9:37:55", "throughput": 332.25, "total_tokens": 39120800} {"current_steps": 30905, "total_steps": 40000, "loss": 0.0365, "lr": 0.03667684874304854, "epoch": 1.5100530134610217, "percentage": 77.26, "elapsed_time": "1 day, 8:42:27", "remaining_time": "9:37:31", "throughput": 332.3, "total_tokens": 39127072} {"current_steps": 30910, "total_steps": 40000, "loss": 0.0576, "lr": 0.03663826520395683, "epoch": 1.510297315124716, "percentage": 77.28, "elapsed_time": "1 day, 8:42:30", "remaining_time": "9:37:07", "throughput": 332.34, "total_tokens": 39132928} {"current_steps": 30915, "total_steps": 40000, "loss": 0.0379, "lr": 0.03659969914666922, "epoch": 1.5105416167884105, "percentage": 77.29, "elapsed_time": "1 day, 8:42:33", "remaining_time": "9:36:44", "throughput": 332.38, "total_tokens": 39139360} {"current_steps": 30920, "total_steps": 40000, "loss": 0.0719, "lr": 0.036561150577133106, "epoch": 1.5107859184521046, "percentage": 77.3, "elapsed_time": "1 day, 8:42:36", "remaining_time": "9:36:20", "throughput": 332.43, "total_tokens": 39145376} {"current_steps": 30925, "total_steps": 40000, "loss": 0.0834, "lr": 0.036522619501293103, "epoch": 1.511030220115799, "percentage": 77.31, "elapsed_time": "1 day, 8:42:39", "remaining_time": "9:35:56", "throughput": 332.47, "total_tokens": 39151968} {"current_steps": 30930, "total_steps": 40000, "loss": 0.0464, "lr": 0.03648410592509122, "epoch": 1.5112745217794932, "percentage": 77.33, "elapsed_time": "1 day, 8:42:42", "remaining_time": "9:35:32", "throughput": 332.52, "total_tokens": 39158144} {"current_steps": 30935, "total_steps": 40000, "loss": 0.0585, "lr": 0.03644560985446676, "epoch": 1.5115188234431876, "percentage": 77.34, "elapsed_time": "1 day, 8:42:45", "remaining_time": "9:35:09", "throughput": 332.57, "total_tokens": 39165024} {"current_steps": 30940, "total_steps": 40000, "loss": 0.0568, "lr": 0.036407131295356256, "epoch": 1.511763125106882, "percentage": 77.35, "elapsed_time": "1 day, 8:42:48", "remaining_time": "9:34:45", "throughput": 332.62, "total_tokens": 39171840} {"current_steps": 30945, "total_steps": 40000, "loss": 0.0477, "lr": 0.03636867025369362, "epoch": 1.5120074267705763, "percentage": 77.36, "elapsed_time": "1 day, 8:42:51", "remaining_time": "9:34:21", "throughput": 332.66, "total_tokens": 39178464} {"current_steps": 30950, "total_steps": 40000, "loss": 0.0589, "lr": 0.03633022673540999, "epoch": 1.5122517284342707, "percentage": 77.38, "elapsed_time": "1 day, 8:42:54", "remaining_time": "9:33:58", "throughput": 332.71, "total_tokens": 39184288} {"current_steps": 30955, "total_steps": 40000, "loss": 0.05, "lr": 0.03629180074643385, "epoch": 1.512496030097965, "percentage": 77.39, "elapsed_time": "1 day, 8:42:57", "remaining_time": "9:33:34", "throughput": 332.75, "total_tokens": 39190624} {"current_steps": 30960, "total_steps": 40000, "loss": 0.0504, "lr": 0.03625339229269102, "epoch": 1.5127403317616595, "percentage": 77.4, "elapsed_time": "1 day, 8:43:00", "remaining_time": "9:33:10", "throughput": 332.8, "total_tokens": 39197152} {"current_steps": 30965, "total_steps": 40000, "loss": 0.0644, "lr": 0.036215001380104535, "epoch": 1.5129846334253536, "percentage": 77.41, "elapsed_time": "1 day, 8:43:04", "remaining_time": "9:32:47", "throughput": 332.85, "total_tokens": 39203872} {"current_steps": 30970, "total_steps": 40000, "loss": 0.0511, "lr": 0.03617662801459471, "epoch": 1.513228935089048, "percentage": 77.42, "elapsed_time": "1 day, 8:43:07", "remaining_time": "9:32:23", "throughput": 332.89, "total_tokens": 39210176} {"current_steps": 30975, "total_steps": 40000, "loss": 0.0548, "lr": 0.036138272202079276, "epoch": 1.5134732367527421, "percentage": 77.44, "elapsed_time": "1 day, 8:43:10", "remaining_time": "9:31:59", "throughput": 332.94, "total_tokens": 39216608} {"current_steps": 30980, "total_steps": 40000, "loss": 0.0617, "lr": 0.036099933948473106, "epoch": 1.5137175384164365, "percentage": 77.45, "elapsed_time": "1 day, 8:43:13", "remaining_time": "9:31:36", "throughput": 332.98, "total_tokens": 39223040} {"current_steps": 30985, "total_steps": 40000, "loss": 0.0489, "lr": 0.03606161325968851, "epoch": 1.513961840080131, "percentage": 77.46, "elapsed_time": "1 day, 8:43:16", "remaining_time": "9:31:12", "throughput": 333.03, "total_tokens": 39229152} {"current_steps": 30990, "total_steps": 40000, "loss": 0.06, "lr": 0.03602331014163496, "epoch": 1.5142061417438253, "percentage": 77.48, "elapsed_time": "1 day, 8:43:19", "remaining_time": "9:30:48", "throughput": 333.07, "total_tokens": 39235776} {"current_steps": 30995, "total_steps": 40000, "loss": 0.0604, "lr": 0.035985024600219295, "epoch": 1.5144504434075197, "percentage": 77.49, "elapsed_time": "1 day, 8:43:22", "remaining_time": "9:30:25", "throughput": 333.12, "total_tokens": 39242272} {"current_steps": 31000, "total_steps": 40000, "loss": 0.086, "lr": 0.03594675664134569, "epoch": 1.514694745071214, "percentage": 77.5, "elapsed_time": "1 day, 8:43:25", "remaining_time": "9:30:01", "throughput": 333.16, "total_tokens": 39248416} {"current_steps": 31000, "total_steps": 40000, "eval_loss": 0.061992477625608444, "epoch": 1.514694745071214, "percentage": 77.5, "elapsed_time": "1 day, 8:54:04", "remaining_time": "9:33:07", "throughput": 331.37, "total_tokens": 39248416} {"current_steps": 31005, "total_steps": 40000, "loss": 0.0762, "lr": 0.03590850627091545, "epoch": 1.5149390467349084, "percentage": 77.51, "elapsed_time": "1 day, 8:54:08", "remaining_time": "9:32:43", "throughput": 331.41, "total_tokens": 39254784} {"current_steps": 31010, "total_steps": 40000, "loss": 0.0713, "lr": 0.03587027349482731, "epoch": 1.5151833483986026, "percentage": 77.53, "elapsed_time": "1 day, 8:54:11", "remaining_time": "9:32:19", "throughput": 331.46, "total_tokens": 39261728} {"current_steps": 31015, "total_steps": 40000, "loss": 0.0728, "lr": 0.035832058318977275, "epoch": 1.515427650062297, "percentage": 77.54, "elapsed_time": "1 day, 8:54:14", "remaining_time": "9:31:56", "throughput": 331.5, "total_tokens": 39267744} {"current_steps": 31020, "total_steps": 40000, "loss": 0.0763, "lr": 0.03579386074925853, "epoch": 1.5156719517259911, "percentage": 77.55, "elapsed_time": "1 day, 8:54:17", "remaining_time": "9:31:32", "throughput": 331.54, "total_tokens": 39273792} {"current_steps": 31025, "total_steps": 40000, "loss": 0.0695, "lr": 0.035755680791561696, "epoch": 1.5159162533896855, "percentage": 77.56, "elapsed_time": "1 day, 8:54:20", "remaining_time": "9:31:08", "throughput": 331.59, "total_tokens": 39280352} {"current_steps": 31030, "total_steps": 40000, "loss": 0.0573, "lr": 0.03571751845177454, "epoch": 1.5161605550533799, "percentage": 77.58, "elapsed_time": "1 day, 8:54:23", "remaining_time": "9:30:44", "throughput": 331.63, "total_tokens": 39286496} {"current_steps": 31035, "total_steps": 40000, "loss": 0.0514, "lr": 0.03567937373578225, "epoch": 1.5164048567170743, "percentage": 77.59, "elapsed_time": "1 day, 8:54:26", "remaining_time": "9:30:21", "throughput": 331.68, "total_tokens": 39292896} {"current_steps": 31040, "total_steps": 40000, "loss": 0.0499, "lr": 0.03564124664946711, "epoch": 1.5166491583807686, "percentage": 77.6, "elapsed_time": "1 day, 8:54:29", "remaining_time": "9:29:57", "throughput": 331.73, "total_tokens": 39299680} {"current_steps": 31045, "total_steps": 40000, "loss": 0.0382, "lr": 0.035603137198708924, "epoch": 1.516893460044463, "percentage": 77.61, "elapsed_time": "1 day, 8:54:33", "remaining_time": "9:29:33", "throughput": 331.77, "total_tokens": 39306336} {"current_steps": 31050, "total_steps": 40000, "loss": 0.0439, "lr": 0.035565045389384514, "epoch": 1.5171377617081574, "percentage": 77.62, "elapsed_time": "1 day, 8:54:36", "remaining_time": "9:29:10", "throughput": 331.82, "total_tokens": 39312704} {"current_steps": 31055, "total_steps": 40000, "loss": 0.0658, "lr": 0.03552697122736823, "epoch": 1.5173820633718516, "percentage": 77.64, "elapsed_time": "1 day, 8:54:39", "remaining_time": "9:28:46", "throughput": 331.87, "total_tokens": 39319296} {"current_steps": 31060, "total_steps": 40000, "loss": 0.0714, "lr": 0.03548891471853153, "epoch": 1.517626365035546, "percentage": 77.65, "elapsed_time": "1 day, 8:54:42", "remaining_time": "9:28:22", "throughput": 331.91, "total_tokens": 39325344} {"current_steps": 31065, "total_steps": 40000, "loss": 0.0461, "lr": 0.03545087586874322, "epoch": 1.51787066669924, "percentage": 77.66, "elapsed_time": "1 day, 8:54:45", "remaining_time": "9:27:59", "throughput": 331.95, "total_tokens": 39331552} {"current_steps": 31070, "total_steps": 40000, "loss": 0.083, "lr": 0.03541285468386935, "epoch": 1.5181149683629345, "percentage": 77.68, "elapsed_time": "1 day, 8:54:48", "remaining_time": "9:27:35", "throughput": 332.0, "total_tokens": 39337952} {"current_steps": 31075, "total_steps": 40000, "loss": 0.0651, "lr": 0.03537485116977327, "epoch": 1.5183592700266288, "percentage": 77.69, "elapsed_time": "1 day, 8:54:51", "remaining_time": "9:27:11", "throughput": 332.04, "total_tokens": 39344032} {"current_steps": 31080, "total_steps": 40000, "loss": 0.0958, "lr": 0.03533686533231565, "epoch": 1.5186035716903232, "percentage": 77.7, "elapsed_time": "1 day, 8:54:54", "remaining_time": "9:26:48", "throughput": 332.09, "total_tokens": 39350560} {"current_steps": 31085, "total_steps": 40000, "loss": 0.0813, "lr": 0.0352988971773543, "epoch": 1.5188478733540176, "percentage": 77.71, "elapsed_time": "1 day, 8:54:57", "remaining_time": "9:26:24", "throughput": 332.13, "total_tokens": 39356608} {"current_steps": 31090, "total_steps": 40000, "loss": 0.0727, "lr": 0.03526094671074443, "epoch": 1.519092175017712, "percentage": 77.72, "elapsed_time": "1 day, 8:55:00", "remaining_time": "9:26:00", "throughput": 332.17, "total_tokens": 39362816} {"current_steps": 31095, "total_steps": 40000, "loss": 0.0391, "lr": 0.03522301393833852, "epoch": 1.5193364766814061, "percentage": 77.74, "elapsed_time": "1 day, 8:55:03", "remaining_time": "9:25:37", "throughput": 332.22, "total_tokens": 39368992} {"current_steps": 31100, "total_steps": 40000, "loss": 0.0773, "lr": 0.035185098865986204, "epoch": 1.5195807783451005, "percentage": 77.75, "elapsed_time": "1 day, 8:55:06", "remaining_time": "9:25:13", "throughput": 332.26, "total_tokens": 39375392} {"current_steps": 31105, "total_steps": 40000, "loss": 0.0557, "lr": 0.03514720149953453, "epoch": 1.519825080008795, "percentage": 77.76, "elapsed_time": "1 day, 8:55:09", "remaining_time": "9:24:49", "throughput": 332.3, "total_tokens": 39381376} {"current_steps": 31110, "total_steps": 40000, "loss": 0.0562, "lr": 0.03510932184482773, "epoch": 1.520069381672489, "percentage": 77.78, "elapsed_time": "1 day, 8:55:12", "remaining_time": "9:24:26", "throughput": 332.35, "total_tokens": 39387456} {"current_steps": 31115, "total_steps": 40000, "loss": 0.0425, "lr": 0.03507145990770724, "epoch": 1.5203136833361834, "percentage": 77.79, "elapsed_time": "1 day, 8:55:16", "remaining_time": "9:24:02", "throughput": 332.39, "total_tokens": 39393728} {"current_steps": 31120, "total_steps": 40000, "loss": 0.0657, "lr": 0.035033615694011984, "epoch": 1.5205579849998778, "percentage": 77.8, "elapsed_time": "1 day, 8:55:19", "remaining_time": "9:23:39", "throughput": 332.44, "total_tokens": 39400224} {"current_steps": 31125, "total_steps": 40000, "loss": 0.0502, "lr": 0.03499578920957788, "epoch": 1.5208022866635722, "percentage": 77.81, "elapsed_time": "1 day, 8:55:22", "remaining_time": "9:23:15", "throughput": 332.48, "total_tokens": 39406656} {"current_steps": 31130, "total_steps": 40000, "loss": 0.0388, "lr": 0.034957980460238375, "epoch": 1.5210465883272666, "percentage": 77.83, "elapsed_time": "1 day, 8:55:25", "remaining_time": "9:22:51", "throughput": 332.53, "total_tokens": 39412736} {"current_steps": 31135, "total_steps": 40000, "loss": 0.0435, "lr": 0.03492018945182393, "epoch": 1.521290889990961, "percentage": 77.84, "elapsed_time": "1 day, 8:55:28", "remaining_time": "9:22:28", "throughput": 332.57, "total_tokens": 39418912} {"current_steps": 31140, "total_steps": 40000, "loss": 0.0602, "lr": 0.03488241619016247, "epoch": 1.5215351916546551, "percentage": 77.85, "elapsed_time": "1 day, 8:55:31", "remaining_time": "9:22:04", "throughput": 332.62, "total_tokens": 39425600} {"current_steps": 31145, "total_steps": 40000, "loss": 0.0513, "lr": 0.03484466068107913, "epoch": 1.5217794933183495, "percentage": 77.86, "elapsed_time": "1 day, 8:55:34", "remaining_time": "9:21:41", "throughput": 332.66, "total_tokens": 39432256} {"current_steps": 31150, "total_steps": 40000, "loss": 0.0562, "lr": 0.034806922930396195, "epoch": 1.5220237949820439, "percentage": 77.88, "elapsed_time": "1 day, 8:55:37", "remaining_time": "9:21:17", "throughput": 332.71, "total_tokens": 39438816} {"current_steps": 31155, "total_steps": 40000, "loss": 0.0917, "lr": 0.03476920294393337, "epoch": 1.522268096645738, "percentage": 77.89, "elapsed_time": "1 day, 8:55:40", "remaining_time": "9:20:54", "throughput": 332.76, "total_tokens": 39445248} {"current_steps": 31160, "total_steps": 40000, "loss": 0.0511, "lr": 0.03473150072750755, "epoch": 1.5225123983094324, "percentage": 77.9, "elapsed_time": "1 day, 8:55:43", "remaining_time": "9:20:30", "throughput": 332.8, "total_tokens": 39451616} {"current_steps": 31165, "total_steps": 40000, "loss": 0.05, "lr": 0.03469381628693284, "epoch": 1.5227566999731268, "percentage": 77.91, "elapsed_time": "1 day, 8:55:47", "remaining_time": "9:20:07", "throughput": 332.85, "total_tokens": 39458208} {"current_steps": 31170, "total_steps": 40000, "loss": 0.0611, "lr": 0.03465614962802072, "epoch": 1.5230010016368212, "percentage": 77.92, "elapsed_time": "1 day, 8:55:50", "remaining_time": "9:19:43", "throughput": 332.89, "total_tokens": 39464288} {"current_steps": 31175, "total_steps": 40000, "loss": 0.047, "lr": 0.0346185007565798, "epoch": 1.5232453033005156, "percentage": 77.94, "elapsed_time": "1 day, 8:55:53", "remaining_time": "9:19:19", "throughput": 332.93, "total_tokens": 39470304} {"current_steps": 31180, "total_steps": 40000, "loss": 0.0583, "lr": 0.03458086967841609, "epoch": 1.52348960496421, "percentage": 77.95, "elapsed_time": "1 day, 8:55:56", "remaining_time": "9:18:56", "throughput": 332.98, "total_tokens": 39476224} {"current_steps": 31185, "total_steps": 40000, "loss": 0.0435, "lr": 0.03454325639933266, "epoch": 1.523733906627904, "percentage": 77.96, "elapsed_time": "1 day, 8:55:59", "remaining_time": "9:18:32", "throughput": 333.02, "total_tokens": 39482784} {"current_steps": 31190, "total_steps": 40000, "loss": 0.0577, "lr": 0.03450566092513007, "epoch": 1.5239782082915985, "percentage": 77.98, "elapsed_time": "1 day, 8:56:02", "remaining_time": "9:18:09", "throughput": 333.06, "total_tokens": 39488672} {"current_steps": 31195, "total_steps": 40000, "loss": 0.074, "lr": 0.034468083261605914, "epoch": 1.5242225099552928, "percentage": 77.99, "elapsed_time": "1 day, 8:56:05", "remaining_time": "9:17:45", "throughput": 333.11, "total_tokens": 39494912} {"current_steps": 31200, "total_steps": 40000, "loss": 0.0554, "lr": 0.03443052341455522, "epoch": 1.524466811618987, "percentage": 78.0, "elapsed_time": "1 day, 8:56:08", "remaining_time": "9:17:22", "throughput": 333.15, "total_tokens": 39501152} {"current_steps": 31200, "total_steps": 40000, "eval_loss": 0.06144215911626816, "epoch": 1.524466811618987, "percentage": 78.0, "elapsed_time": "1 day, 9:06:46", "remaining_time": "9:20:22", "throughput": 331.37, "total_tokens": 39501152} {"current_steps": 31205, "total_steps": 40000, "loss": 0.053, "lr": 0.0343929813897701, "epoch": 1.5247111132826814, "percentage": 78.01, "elapsed_time": "1 day, 9:06:50", "remaining_time": "9:19:58", "throughput": 331.41, "total_tokens": 39507104} {"current_steps": 31210, "total_steps": 40000, "loss": 0.0595, "lr": 0.034355457193040125, "epoch": 1.5249554149463758, "percentage": 78.03, "elapsed_time": "1 day, 9:06:53", "remaining_time": "9:19:35", "throughput": 331.45, "total_tokens": 39513568} {"current_steps": 31215, "total_steps": 40000, "loss": 0.0671, "lr": 0.03431795083015186, "epoch": 1.5251997166100701, "percentage": 78.04, "elapsed_time": "1 day, 9:06:56", "remaining_time": "9:19:11", "throughput": 331.5, "total_tokens": 39520128} {"current_steps": 31220, "total_steps": 40000, "loss": 0.0636, "lr": 0.03428046230688936, "epoch": 1.5254440182737645, "percentage": 78.05, "elapsed_time": "1 day, 9:06:59", "remaining_time": "9:18:48", "throughput": 331.54, "total_tokens": 39526304} {"current_steps": 31225, "total_steps": 40000, "loss": 0.0546, "lr": 0.034242991629033805, "epoch": 1.525688319937459, "percentage": 78.06, "elapsed_time": "1 day, 9:07:02", "remaining_time": "9:18:24", "throughput": 331.59, "total_tokens": 39532672} {"current_steps": 31230, "total_steps": 40000, "loss": 0.0555, "lr": 0.03420553880236362, "epoch": 1.525932621601153, "percentage": 78.08, "elapsed_time": "1 day, 9:07:05", "remaining_time": "9:18:00", "throughput": 331.63, "total_tokens": 39539008} {"current_steps": 31235, "total_steps": 40000, "loss": 0.0666, "lr": 0.03416810383265449, "epoch": 1.5261769232648474, "percentage": 78.09, "elapsed_time": "1 day, 9:07:08", "remaining_time": "9:17:37", "throughput": 331.67, "total_tokens": 39544800} {"current_steps": 31240, "total_steps": 40000, "loss": 0.0406, "lr": 0.03413068672567944, "epoch": 1.5264212249285416, "percentage": 78.1, "elapsed_time": "1 day, 9:07:11", "remaining_time": "9:17:13", "throughput": 331.72, "total_tokens": 39551552} {"current_steps": 31245, "total_steps": 40000, "loss": 0.0437, "lr": 0.034093287487208565, "epoch": 1.526665526592236, "percentage": 78.11, "elapsed_time": "1 day, 9:07:14", "remaining_time": "9:16:50", "throughput": 331.76, "total_tokens": 39557536} {"current_steps": 31250, "total_steps": 40000, "loss": 0.0684, "lr": 0.03405590612300937, "epoch": 1.5269098282559304, "percentage": 78.12, "elapsed_time": "1 day, 9:07:17", "remaining_time": "9:16:26", "throughput": 331.8, "total_tokens": 39563584} {"current_steps": 31255, "total_steps": 40000, "loss": 0.0759, "lr": 0.03401854263884646, "epoch": 1.5271541299196247, "percentage": 78.14, "elapsed_time": "1 day, 9:07:20", "remaining_time": "9:16:03", "throughput": 331.85, "total_tokens": 39569632} {"current_steps": 31260, "total_steps": 40000, "loss": 0.0425, "lr": 0.033981197040481824, "epoch": 1.5273984315833191, "percentage": 78.15, "elapsed_time": "1 day, 9:07:24", "remaining_time": "9:15:39", "throughput": 331.89, "total_tokens": 39576192} {"current_steps": 31265, "total_steps": 40000, "loss": 0.0844, "lr": 0.03394386933367459, "epoch": 1.5276427332470135, "percentage": 78.16, "elapsed_time": "1 day, 9:07:27", "remaining_time": "9:15:15", "throughput": 331.94, "total_tokens": 39582368} {"current_steps": 31270, "total_steps": 40000, "loss": 0.0704, "lr": 0.033906559524181104, "epoch": 1.5278870349107079, "percentage": 78.17, "elapsed_time": "1 day, 9:07:30", "remaining_time": "9:14:52", "throughput": 331.98, "total_tokens": 39588160} {"current_steps": 31275, "total_steps": 40000, "loss": 0.0597, "lr": 0.033869267617755085, "epoch": 1.528131336574402, "percentage": 78.19, "elapsed_time": "1 day, 9:07:33", "remaining_time": "9:14:28", "throughput": 332.02, "total_tokens": 39594080} {"current_steps": 31280, "total_steps": 40000, "loss": 0.0592, "lr": 0.0338319936201474, "epoch": 1.5283756382380964, "percentage": 78.2, "elapsed_time": "1 day, 9:07:36", "remaining_time": "9:14:05", "throughput": 332.07, "total_tokens": 39600896} {"current_steps": 31285, "total_steps": 40000, "loss": 0.0761, "lr": 0.033794737537106136, "epoch": 1.5286199399017906, "percentage": 78.21, "elapsed_time": "1 day, 9:07:39", "remaining_time": "9:13:41", "throughput": 332.11, "total_tokens": 39607232} {"current_steps": 31290, "total_steps": 40000, "loss": 0.0484, "lr": 0.03375749937437671, "epoch": 1.528864241565485, "percentage": 78.22, "elapsed_time": "1 day, 9:07:42", "remaining_time": "9:13:18", "throughput": 332.16, "total_tokens": 39613728} {"current_steps": 31295, "total_steps": 40000, "loss": 0.064, "lr": 0.033720279137701634, "epoch": 1.5291085432291793, "percentage": 78.24, "elapsed_time": "1 day, 9:07:45", "remaining_time": "9:12:54", "throughput": 332.2, "total_tokens": 39619808} {"current_steps": 31300, "total_steps": 40000, "loss": 0.047, "lr": 0.03368307683282078, "epoch": 1.5293528448928737, "percentage": 78.25, "elapsed_time": "1 day, 9:07:48", "remaining_time": "9:12:31", "throughput": 332.24, "total_tokens": 39626176} {"current_steps": 31305, "total_steps": 40000, "loss": 0.0386, "lr": 0.033645892465471235, "epoch": 1.529597146556568, "percentage": 78.26, "elapsed_time": "1 day, 9:07:51", "remaining_time": "9:12:07", "throughput": 332.29, "total_tokens": 39633120} {"current_steps": 31310, "total_steps": 40000, "loss": 0.0594, "lr": 0.03360872604138724, "epoch": 1.5298414482202625, "percentage": 78.27, "elapsed_time": "1 day, 9:07:54", "remaining_time": "9:11:44", "throughput": 332.34, "total_tokens": 39639296} {"current_steps": 31315, "total_steps": 40000, "loss": 0.0629, "lr": 0.03357157756630034, "epoch": 1.5300857498839568, "percentage": 78.29, "elapsed_time": "1 day, 9:07:58", "remaining_time": "9:11:20", "throughput": 332.38, "total_tokens": 39646016} {"current_steps": 31320, "total_steps": 40000, "loss": 0.0821, "lr": 0.033534447045939365, "epoch": 1.530330051547651, "percentage": 78.3, "elapsed_time": "1 day, 9:08:01", "remaining_time": "9:10:57", "throughput": 332.43, "total_tokens": 39652160} {"current_steps": 31325, "total_steps": 40000, "loss": 0.0392, "lr": 0.03349733448603026, "epoch": 1.5305743532113454, "percentage": 78.31, "elapsed_time": "1 day, 9:08:04", "remaining_time": "9:10:34", "throughput": 332.47, "total_tokens": 39658400} {"current_steps": 31330, "total_steps": 40000, "loss": 0.0577, "lr": 0.03346023989229619, "epoch": 1.5308186548750395, "percentage": 78.33, "elapsed_time": "1 day, 9:08:07", "remaining_time": "9:10:10", "throughput": 332.52, "total_tokens": 39664960} {"current_steps": 31335, "total_steps": 40000, "loss": 0.0775, "lr": 0.03342316327045769, "epoch": 1.531062956538734, "percentage": 78.34, "elapsed_time": "1 day, 9:08:10", "remaining_time": "9:09:47", "throughput": 332.56, "total_tokens": 39671808} {"current_steps": 31340, "total_steps": 40000, "loss": 0.0507, "lr": 0.033386104626232385, "epoch": 1.5313072582024283, "percentage": 78.35, "elapsed_time": "1 day, 9:08:13", "remaining_time": "9:09:23", "throughput": 332.61, "total_tokens": 39678880} {"current_steps": 31345, "total_steps": 40000, "loss": 0.0415, "lr": 0.03334906396533525, "epoch": 1.5315515598661227, "percentage": 78.36, "elapsed_time": "1 day, 9:08:16", "remaining_time": "9:09:00", "throughput": 332.66, "total_tokens": 39685088} {"current_steps": 31350, "total_steps": 40000, "loss": 0.0622, "lr": 0.033312041293478326, "epoch": 1.531795861529817, "percentage": 78.38, "elapsed_time": "1 day, 9:08:19", "remaining_time": "9:08:36", "throughput": 332.7, "total_tokens": 39691232} {"current_steps": 31355, "total_steps": 40000, "loss": 0.0391, "lr": 0.03327503661637103, "epoch": 1.5320401631935114, "percentage": 78.39, "elapsed_time": "1 day, 9:08:23", "remaining_time": "9:08:13", "throughput": 332.75, "total_tokens": 39697792} {"current_steps": 31360, "total_steps": 40000, "loss": 0.0504, "lr": 0.03323804993971998, "epoch": 1.5322844648572058, "percentage": 78.4, "elapsed_time": "1 day, 9:08:26", "remaining_time": "9:07:50", "throughput": 332.79, "total_tokens": 39703904} {"current_steps": 31365, "total_steps": 40000, "loss": 0.0749, "lr": 0.033201081269228924, "epoch": 1.5325287665209, "percentage": 78.41, "elapsed_time": "1 day, 9:08:29", "remaining_time": "9:07:26", "throughput": 332.83, "total_tokens": 39709728} {"current_steps": 31370, "total_steps": 40000, "loss": 0.0636, "lr": 0.03316413061059895, "epoch": 1.5327730681845944, "percentage": 78.42, "elapsed_time": "1 day, 9:08:32", "remaining_time": "9:07:03", "throughput": 332.88, "total_tokens": 39716128} {"current_steps": 31375, "total_steps": 40000, "loss": 0.0395, "lr": 0.03312719796952827, "epoch": 1.5330173698482885, "percentage": 78.44, "elapsed_time": "1 day, 9:08:35", "remaining_time": "9:06:39", "throughput": 332.92, "total_tokens": 39722592} {"current_steps": 31380, "total_steps": 40000, "loss": 0.0654, "lr": 0.03309028335171236, "epoch": 1.533261671511983, "percentage": 78.45, "elapsed_time": "1 day, 9:08:38", "remaining_time": "9:06:16", "throughput": 332.97, "total_tokens": 39729440} {"current_steps": 31385, "total_steps": 40000, "loss": 0.075, "lr": 0.03305338676284398, "epoch": 1.5335059731756773, "percentage": 78.46, "elapsed_time": "1 day, 9:08:41", "remaining_time": "9:05:53", "throughput": 333.02, "total_tokens": 39737024} {"current_steps": 31390, "total_steps": 40000, "loss": 0.031, "lr": 0.03301650820861296, "epoch": 1.5337502748393717, "percentage": 78.47, "elapsed_time": "1 day, 9:08:44", "remaining_time": "9:05:29", "throughput": 333.07, "total_tokens": 39742976} {"current_steps": 31395, "total_steps": 40000, "loss": 0.0541, "lr": 0.03297964769470652, "epoch": 1.533994576503066, "percentage": 78.49, "elapsed_time": "1 day, 9:08:47", "remaining_time": "9:05:06", "throughput": 333.11, "total_tokens": 39749280} {"current_steps": 31400, "total_steps": 40000, "loss": 0.0353, "lr": 0.032942805226808945, "epoch": 1.5342388781667604, "percentage": 78.5, "elapsed_time": "1 day, 9:08:51", "remaining_time": "9:04:43", "throughput": 333.16, "total_tokens": 39756224} {"current_steps": 31400, "total_steps": 40000, "eval_loss": 0.061628974974155426, "epoch": 1.5342388781667604, "percentage": 78.5, "elapsed_time": "1 day, 9:19:29", "remaining_time": "9:07:37", "throughput": 331.39, "total_tokens": 39756224} {"current_steps": 31405, "total_steps": 40000, "loss": 0.0484, "lr": 0.03290598081060187, "epoch": 1.5344831798304548, "percentage": 78.51, "elapsed_time": "1 day, 9:19:34", "remaining_time": "9:07:14", "throughput": 331.43, "total_tokens": 39762656} {"current_steps": 31410, "total_steps": 40000, "loss": 0.0695, "lr": 0.03286917445176407, "epoch": 1.534727481494149, "percentage": 78.53, "elapsed_time": "1 day, 9:19:37", "remaining_time": "9:06:51", "throughput": 331.47, "total_tokens": 39769440} {"current_steps": 31415, "total_steps": 40000, "loss": 0.0315, "lr": 0.032832386155971456, "epoch": 1.5349717831578433, "percentage": 78.54, "elapsed_time": "1 day, 9:19:40", "remaining_time": "9:06:27", "throughput": 331.52, "total_tokens": 39775904} {"current_steps": 31420, "total_steps": 40000, "loss": 0.0435, "lr": 0.032795615928897334, "epoch": 1.5352160848215375, "percentage": 78.55, "elapsed_time": "1 day, 9:19:43", "remaining_time": "9:06:04", "throughput": 331.57, "total_tokens": 39782560} {"current_steps": 31425, "total_steps": 40000, "loss": 0.0731, "lr": 0.03275886377621215, "epoch": 1.5354603864852319, "percentage": 78.56, "elapsed_time": "1 day, 9:19:46", "remaining_time": "9:05:40", "throughput": 331.61, "total_tokens": 39788640} {"current_steps": 31430, "total_steps": 40000, "loss": 0.0727, "lr": 0.03272212970358348, "epoch": 1.5357046881489262, "percentage": 78.57, "elapsed_time": "1 day, 9:19:49", "remaining_time": "9:05:17", "throughput": 331.66, "total_tokens": 39795520} {"current_steps": 31435, "total_steps": 40000, "loss": 0.0528, "lr": 0.032685413716676215, "epoch": 1.5359489898126206, "percentage": 78.59, "elapsed_time": "1 day, 9:19:52", "remaining_time": "9:04:54", "throughput": 331.7, "total_tokens": 39802048} {"current_steps": 31440, "total_steps": 40000, "loss": 0.0387, "lr": 0.032648715821152474, "epoch": 1.536193291476315, "percentage": 78.6, "elapsed_time": "1 day, 9:19:55", "remaining_time": "9:04:30", "throughput": 331.75, "total_tokens": 39808128} {"current_steps": 31445, "total_steps": 40000, "loss": 0.0513, "lr": 0.03261203602267143, "epoch": 1.5364375931400094, "percentage": 78.61, "elapsed_time": "1 day, 9:19:58", "remaining_time": "9:04:07", "throughput": 331.79, "total_tokens": 39814272} {"current_steps": 31450, "total_steps": 40000, "loss": 0.0646, "lr": 0.03257537432688966, "epoch": 1.5366818948037038, "percentage": 78.62, "elapsed_time": "1 day, 9:20:02", "remaining_time": "9:03:43", "throughput": 331.83, "total_tokens": 39820800} {"current_steps": 31455, "total_steps": 40000, "loss": 0.0566, "lr": 0.03253873073946077, "epoch": 1.536926196467398, "percentage": 78.64, "elapsed_time": "1 day, 9:20:05", "remaining_time": "9:03:20", "throughput": 331.88, "total_tokens": 39826784} {"current_steps": 31460, "total_steps": 40000, "loss": 0.0689, "lr": 0.03250210526603572, "epoch": 1.5371704981310923, "percentage": 78.65, "elapsed_time": "1 day, 9:20:08", "remaining_time": "9:02:56", "throughput": 331.92, "total_tokens": 39832672} {"current_steps": 31465, "total_steps": 40000, "loss": 0.0363, "lr": 0.03246549791226266, "epoch": 1.5374147997947865, "percentage": 78.66, "elapsed_time": "1 day, 9:20:11", "remaining_time": "9:02:33", "throughput": 331.96, "total_tokens": 39839200} {"current_steps": 31470, "total_steps": 40000, "loss": 0.0563, "lr": 0.03242890868378679, "epoch": 1.5376591014584808, "percentage": 78.67, "elapsed_time": "1 day, 9:20:14", "remaining_time": "9:02:10", "throughput": 332.01, "total_tokens": 39845376} {"current_steps": 31475, "total_steps": 40000, "loss": 0.06, "lr": 0.03239233758625074, "epoch": 1.5379034031221752, "percentage": 78.69, "elapsed_time": "1 day, 9:20:17", "remaining_time": "9:01:46", "throughput": 332.05, "total_tokens": 39851840} {"current_steps": 31480, "total_steps": 40000, "loss": 0.0664, "lr": 0.032355784625294204, "epoch": 1.5381477047858696, "percentage": 78.7, "elapsed_time": "1 day, 9:20:20", "remaining_time": "9:01:23", "throughput": 332.1, "total_tokens": 39858496} {"current_steps": 31485, "total_steps": 40000, "loss": 0.0432, "lr": 0.03231924980655402, "epoch": 1.538392006449564, "percentage": 78.71, "elapsed_time": "1 day, 9:20:23", "remaining_time": "9:01:00", "throughput": 332.15, "total_tokens": 39866240} {"current_steps": 31490, "total_steps": 40000, "loss": 0.0894, "lr": 0.032282733135664446, "epoch": 1.5386363081132584, "percentage": 78.72, "elapsed_time": "1 day, 9:20:27", "remaining_time": "9:00:36", "throughput": 332.2, "total_tokens": 39872640} {"current_steps": 31495, "total_steps": 40000, "loss": 0.0359, "lr": 0.03224623461825669, "epoch": 1.5388806097769527, "percentage": 78.74, "elapsed_time": "1 day, 9:20:30", "remaining_time": "9:00:13", "throughput": 332.24, "total_tokens": 39879008} {"current_steps": 31500, "total_steps": 40000, "loss": 0.085, "lr": 0.03220975425995937, "epoch": 1.539124911440647, "percentage": 78.75, "elapsed_time": "1 day, 9:20:33", "remaining_time": "8:59:49", "throughput": 332.29, "total_tokens": 39885408} {"current_steps": 31505, "total_steps": 40000, "loss": 0.0272, "lr": 0.032173292066398206, "epoch": 1.5393692131043413, "percentage": 78.76, "elapsed_time": "1 day, 9:20:36", "remaining_time": "8:59:26", "throughput": 332.33, "total_tokens": 39891584} {"current_steps": 31510, "total_steps": 40000, "loss": 0.0417, "lr": 0.03213684804319606, "epoch": 1.5396135147680354, "percentage": 78.77, "elapsed_time": "1 day, 9:20:39", "remaining_time": "8:59:03", "throughput": 332.37, "total_tokens": 39897952} {"current_steps": 31515, "total_steps": 40000, "loss": 0.0543, "lr": 0.03210042219597312, "epoch": 1.5398578164317298, "percentage": 78.79, "elapsed_time": "1 day, 9:20:42", "remaining_time": "8:58:39", "throughput": 332.42, "total_tokens": 39904128} {"current_steps": 31520, "total_steps": 40000, "loss": 0.0752, "lr": 0.03206401453034675, "epoch": 1.5401021180954242, "percentage": 78.8, "elapsed_time": "1 day, 9:20:45", "remaining_time": "8:58:16", "throughput": 332.46, "total_tokens": 39910432} {"current_steps": 31525, "total_steps": 40000, "loss": 0.0559, "lr": 0.03202762505193136, "epoch": 1.5403464197591186, "percentage": 78.81, "elapsed_time": "1 day, 9:20:48", "remaining_time": "8:57:53", "throughput": 332.51, "total_tokens": 39917312} {"current_steps": 31530, "total_steps": 40000, "loss": 0.0518, "lr": 0.031991253766338754, "epoch": 1.540590721422813, "percentage": 78.83, "elapsed_time": "1 day, 9:20:51", "remaining_time": "8:57:29", "throughput": 332.55, "total_tokens": 39923648} {"current_steps": 31535, "total_steps": 40000, "loss": 0.0494, "lr": 0.03195490067917778, "epoch": 1.5408350230865073, "percentage": 78.84, "elapsed_time": "1 day, 9:20:54", "remaining_time": "8:57:06", "throughput": 332.6, "total_tokens": 39929888} {"current_steps": 31540, "total_steps": 40000, "loss": 0.0435, "lr": 0.03191856579605461, "epoch": 1.5410793247502017, "percentage": 78.85, "elapsed_time": "1 day, 9:20:57", "remaining_time": "8:56:43", "throughput": 332.64, "total_tokens": 39936032} {"current_steps": 31545, "total_steps": 40000, "loss": 0.0546, "lr": 0.031882249122572454, "epoch": 1.5413236264138959, "percentage": 78.86, "elapsed_time": "1 day, 9:21:01", "remaining_time": "8:56:19", "throughput": 332.69, "total_tokens": 39942720} {"current_steps": 31550, "total_steps": 40000, "loss": 0.0508, "lr": 0.03184595066433188, "epoch": 1.5415679280775902, "percentage": 78.88, "elapsed_time": "1 day, 9:21:04", "remaining_time": "8:55:56", "throughput": 332.73, "total_tokens": 39949120} {"current_steps": 31555, "total_steps": 40000, "loss": 0.0635, "lr": 0.03180967042693049, "epoch": 1.5418122297412844, "percentage": 78.89, "elapsed_time": "1 day, 9:21:07", "remaining_time": "8:55:33", "throughput": 332.78, "total_tokens": 39956096} {"current_steps": 31560, "total_steps": 40000, "loss": 0.0666, "lr": 0.03177340841596323, "epoch": 1.5420565314049788, "percentage": 78.9, "elapsed_time": "1 day, 9:21:10", "remaining_time": "8:55:10", "throughput": 332.82, "total_tokens": 39962432} {"current_steps": 31565, "total_steps": 40000, "loss": 0.0486, "lr": 0.03173716463702209, "epoch": 1.5423008330686732, "percentage": 78.91, "elapsed_time": "1 day, 9:21:13", "remaining_time": "8:54:46", "throughput": 332.87, "total_tokens": 39968672} {"current_steps": 31570, "total_steps": 40000, "loss": 0.0809, "lr": 0.03170093909569638, "epoch": 1.5425451347323675, "percentage": 78.92, "elapsed_time": "1 day, 9:21:16", "remaining_time": "8:54:23", "throughput": 332.91, "total_tokens": 39974816} {"current_steps": 31575, "total_steps": 40000, "loss": 0.0634, "lr": 0.03166473179757246, "epoch": 1.542789436396062, "percentage": 78.94, "elapsed_time": "1 day, 9:21:19", "remaining_time": "8:54:00", "throughput": 332.95, "total_tokens": 39980928} {"current_steps": 31580, "total_steps": 40000, "loss": 0.0301, "lr": 0.031628542748234005, "epoch": 1.5430337380597563, "percentage": 78.95, "elapsed_time": "1 day, 9:21:22", "remaining_time": "8:53:36", "throughput": 333.0, "total_tokens": 39987168} {"current_steps": 31585, "total_steps": 40000, "loss": 0.0437, "lr": 0.03159237195326184, "epoch": 1.5432780397234507, "percentage": 78.96, "elapsed_time": "1 day, 9:21:25", "remaining_time": "8:53:13", "throughput": 333.04, "total_tokens": 39993376} {"current_steps": 31590, "total_steps": 40000, "loss": 0.049, "lr": 0.031556219418233875, "epoch": 1.5435223413871448, "percentage": 78.97, "elapsed_time": "1 day, 9:21:28", "remaining_time": "8:52:50", "throughput": 333.09, "total_tokens": 40000064} {"current_steps": 31595, "total_steps": 40000, "loss": 0.0239, "lr": 0.03152008514872533, "epoch": 1.5437666430508392, "percentage": 78.99, "elapsed_time": "1 day, 9:21:32", "remaining_time": "8:52:27", "throughput": 333.13, "total_tokens": 40006560} {"current_steps": 31600, "total_steps": 40000, "loss": 0.0717, "lr": 0.03148396915030862, "epoch": 1.5440109447145334, "percentage": 79.0, "elapsed_time": "1 day, 9:21:35", "remaining_time": "8:52:04", "throughput": 333.18, "total_tokens": 40012896} {"current_steps": 31600, "total_steps": 40000, "eval_loss": 0.061177898198366165, "epoch": 1.5440109447145334, "percentage": 79.0, "elapsed_time": "1 day, 9:32:14", "remaining_time": "8:54:53", "throughput": 331.41, "total_tokens": 40012896} {"current_steps": 31605, "total_steps": 40000, "loss": 0.0602, "lr": 0.03144787142855318, "epoch": 1.5442552463782278, "percentage": 79.01, "elapsed_time": "1 day, 9:32:18", "remaining_time": "8:54:30", "throughput": 331.46, "total_tokens": 40019648} {"current_steps": 31610, "total_steps": 40000, "loss": 0.0605, "lr": 0.031411791989025835, "epoch": 1.5444995480419221, "percentage": 79.03, "elapsed_time": "1 day, 9:32:21", "remaining_time": "8:54:07", "throughput": 331.5, "total_tokens": 40026208} {"current_steps": 31615, "total_steps": 40000, "loss": 0.0473, "lr": 0.031375730837290394, "epoch": 1.5447438497056165, "percentage": 79.04, "elapsed_time": "1 day, 9:32:24", "remaining_time": "8:53:44", "throughput": 331.54, "total_tokens": 40031840} {"current_steps": 31620, "total_steps": 40000, "loss": 0.0593, "lr": 0.031339687978908015, "epoch": 1.544988151369311, "percentage": 79.05, "elapsed_time": "1 day, 9:32:27", "remaining_time": "8:53:20", "throughput": 331.59, "total_tokens": 40038752} {"current_steps": 31625, "total_steps": 40000, "loss": 0.0383, "lr": 0.03130366341943694, "epoch": 1.5452324530330053, "percentage": 79.06, "elapsed_time": "1 day, 9:32:30", "remaining_time": "8:52:57", "throughput": 331.64, "total_tokens": 40045248} {"current_steps": 31630, "total_steps": 40000, "loss": 0.0698, "lr": 0.031267657164432555, "epoch": 1.5454767546966997, "percentage": 79.07, "elapsed_time": "1 day, 9:32:34", "remaining_time": "8:52:34", "throughput": 331.68, "total_tokens": 40051680} {"current_steps": 31635, "total_steps": 40000, "loss": 0.0847, "lr": 0.03123166921944752, "epoch": 1.5457210563603938, "percentage": 79.09, "elapsed_time": "1 day, 9:32:37", "remaining_time": "8:52:10", "throughput": 331.72, "total_tokens": 40058112} {"current_steps": 31640, "total_steps": 40000, "loss": 0.0438, "lr": 0.031195699590031666, "epoch": 1.5459653580240882, "percentage": 79.1, "elapsed_time": "1 day, 9:32:40", "remaining_time": "8:51:47", "throughput": 331.76, "total_tokens": 40063968} {"current_steps": 31645, "total_steps": 40000, "loss": 0.0635, "lr": 0.031159748281731885, "epoch": 1.5462096596877823, "percentage": 79.11, "elapsed_time": "1 day, 9:32:43", "remaining_time": "8:51:24", "throughput": 331.81, "total_tokens": 40070048} {"current_steps": 31650, "total_steps": 40000, "loss": 0.0829, "lr": 0.031123815300092394, "epoch": 1.5464539613514767, "percentage": 79.12, "elapsed_time": "1 day, 9:32:46", "remaining_time": "8:51:00", "throughput": 331.85, "total_tokens": 40076000} {"current_steps": 31655, "total_steps": 40000, "loss": 0.0438, "lr": 0.031087900650654424, "epoch": 1.546698263015171, "percentage": 79.14, "elapsed_time": "1 day, 9:32:49", "remaining_time": "8:50:37", "throughput": 331.9, "total_tokens": 40082976} {"current_steps": 31660, "total_steps": 40000, "loss": 0.0381, "lr": 0.031052004338956534, "epoch": 1.5469425646788655, "percentage": 79.15, "elapsed_time": "1 day, 9:32:52", "remaining_time": "8:50:14", "throughput": 331.94, "total_tokens": 40089536} {"current_steps": 31665, "total_steps": 40000, "loss": 0.054, "lr": 0.031016126370534407, "epoch": 1.5471868663425599, "percentage": 79.16, "elapsed_time": "1 day, 9:32:55", "remaining_time": "8:49:51", "throughput": 331.98, "total_tokens": 40095680} {"current_steps": 31670, "total_steps": 40000, "loss": 0.0479, "lr": 0.030980266750920804, "epoch": 1.5474311680062542, "percentage": 79.17, "elapsed_time": "1 day, 9:32:58", "remaining_time": "8:49:27", "throughput": 332.03, "total_tokens": 40101824} {"current_steps": 31675, "total_steps": 40000, "loss": 0.0684, "lr": 0.030944425485645747, "epoch": 1.5476754696699484, "percentage": 79.19, "elapsed_time": "1 day, 9:33:01", "remaining_time": "8:49:04", "throughput": 332.07, "total_tokens": 40108032} {"current_steps": 31680, "total_steps": 40000, "loss": 0.0407, "lr": 0.03090860258023647, "epoch": 1.5479197713336428, "percentage": 79.2, "elapsed_time": "1 day, 9:33:04", "remaining_time": "8:48:41", "throughput": 332.11, "total_tokens": 40114272} {"current_steps": 31685, "total_steps": 40000, "loss": 0.0592, "lr": 0.030872798040217236, "epoch": 1.5481640729973372, "percentage": 79.21, "elapsed_time": "1 day, 9:33:07", "remaining_time": "8:48:18", "throughput": 332.16, "total_tokens": 40120608} {"current_steps": 31690, "total_steps": 40000, "loss": 0.0869, "lr": 0.03083701187110964, "epoch": 1.5484083746610313, "percentage": 79.22, "elapsed_time": "1 day, 9:33:11", "remaining_time": "8:47:54", "throughput": 332.2, "total_tokens": 40127168} {"current_steps": 31695, "total_steps": 40000, "loss": 0.0814, "lr": 0.030801244078432294, "epoch": 1.5486526763247257, "percentage": 79.24, "elapsed_time": "1 day, 9:33:14", "remaining_time": "8:47:31", "throughput": 332.25, "total_tokens": 40133248} {"current_steps": 31700, "total_steps": 40000, "loss": 0.0724, "lr": 0.030765494667701024, "epoch": 1.54889697798842, "percentage": 79.25, "elapsed_time": "1 day, 9:33:17", "remaining_time": "8:47:08", "throughput": 332.29, "total_tokens": 40139264} {"current_steps": 31705, "total_steps": 40000, "loss": 0.0846, "lr": 0.030729763644428913, "epoch": 1.5491412796521145, "percentage": 79.26, "elapsed_time": "1 day, 9:33:20", "remaining_time": "8:46:45", "throughput": 332.33, "total_tokens": 40145760} {"current_steps": 31710, "total_steps": 40000, "loss": 0.0495, "lr": 0.030694051014126048, "epoch": 1.5493855813158088, "percentage": 79.27, "elapsed_time": "1 day, 9:33:23", "remaining_time": "8:46:21", "throughput": 332.38, "total_tokens": 40152960} {"current_steps": 31715, "total_steps": 40000, "loss": 0.0402, "lr": 0.030658356782299792, "epoch": 1.5496298829795032, "percentage": 79.29, "elapsed_time": "1 day, 9:33:26", "remaining_time": "8:45:58", "throughput": 332.43, "total_tokens": 40159680} {"current_steps": 31720, "total_steps": 40000, "loss": 0.0719, "lr": 0.030622680954454726, "epoch": 1.5498741846431974, "percentage": 79.3, "elapsed_time": "1 day, 9:33:29", "remaining_time": "8:45:35", "throughput": 332.47, "total_tokens": 40166016} {"current_steps": 31725, "total_steps": 40000, "loss": 0.0717, "lr": 0.030587023536092398, "epoch": 1.5501184863068918, "percentage": 79.31, "elapsed_time": "1 day, 9:33:32", "remaining_time": "8:45:12", "throughput": 332.52, "total_tokens": 40172320} {"current_steps": 31730, "total_steps": 40000, "loss": 0.0598, "lr": 0.03055138453271171, "epoch": 1.5503627879705861, "percentage": 79.33, "elapsed_time": "1 day, 9:33:35", "remaining_time": "8:44:49", "throughput": 332.56, "total_tokens": 40178528} {"current_steps": 31735, "total_steps": 40000, "loss": 0.0734, "lr": 0.03051576394980858, "epoch": 1.5506070896342803, "percentage": 79.34, "elapsed_time": "1 day, 9:33:39", "remaining_time": "8:44:25", "throughput": 332.6, "total_tokens": 40184992} {"current_steps": 31740, "total_steps": 40000, "loss": 0.0303, "lr": 0.030480161792876187, "epoch": 1.5508513912979747, "percentage": 79.35, "elapsed_time": "1 day, 9:33:42", "remaining_time": "8:44:02", "throughput": 332.65, "total_tokens": 40191712} {"current_steps": 31745, "total_steps": 40000, "loss": 0.0337, "lr": 0.030444578067404846, "epoch": 1.551095692961669, "percentage": 79.36, "elapsed_time": "1 day, 9:33:45", "remaining_time": "8:43:39", "throughput": 332.69, "total_tokens": 40197728} {"current_steps": 31750, "total_steps": 40000, "loss": 0.0643, "lr": 0.030409012778881975, "epoch": 1.5513399946253634, "percentage": 79.38, "elapsed_time": "1 day, 9:33:48", "remaining_time": "8:43:16", "throughput": 332.74, "total_tokens": 40204320} {"current_steps": 31755, "total_steps": 40000, "loss": 0.0819, "lr": 0.030373465932792235, "epoch": 1.5515842962890578, "percentage": 79.39, "elapsed_time": "1 day, 9:33:51", "remaining_time": "8:42:53", "throughput": 332.78, "total_tokens": 40210560} {"current_steps": 31760, "total_steps": 40000, "loss": 0.0624, "lr": 0.030337937534617342, "epoch": 1.5518285979527522, "percentage": 79.4, "elapsed_time": "1 day, 9:33:54", "remaining_time": "8:42:30", "throughput": 332.83, "total_tokens": 40217344} {"current_steps": 31765, "total_steps": 40000, "loss": 0.0528, "lr": 0.030302427589836277, "epoch": 1.5520728996164463, "percentage": 79.41, "elapsed_time": "1 day, 9:33:57", "remaining_time": "8:42:06", "throughput": 332.87, "total_tokens": 40223584} {"current_steps": 31770, "total_steps": 40000, "loss": 0.0429, "lr": 0.030266936103925095, "epoch": 1.5523172012801407, "percentage": 79.42, "elapsed_time": "1 day, 9:34:00", "remaining_time": "8:41:43", "throughput": 332.92, "total_tokens": 40230048} {"current_steps": 31775, "total_steps": 40000, "loss": 0.0783, "lr": 0.030231463082356982, "epoch": 1.5525615029438349, "percentage": 79.44, "elapsed_time": "1 day, 9:34:03", "remaining_time": "8:41:20", "throughput": 332.96, "total_tokens": 40236416} {"current_steps": 31780, "total_steps": 40000, "loss": 0.0533, "lr": 0.030196008530602367, "epoch": 1.5528058046075293, "percentage": 79.45, "elapsed_time": "1 day, 9:34:06", "remaining_time": "8:40:57", "throughput": 333.0, "total_tokens": 40242560} {"current_steps": 31785, "total_steps": 40000, "loss": 0.0444, "lr": 0.030160572454128842, "epoch": 1.5530501062712236, "percentage": 79.46, "elapsed_time": "1 day, 9:34:09", "remaining_time": "8:40:34", "throughput": 333.05, "total_tokens": 40248992} {"current_steps": 31790, "total_steps": 40000, "loss": 0.0667, "lr": 0.03012515485840098, "epoch": 1.553294407934918, "percentage": 79.47, "elapsed_time": "1 day, 9:34:13", "remaining_time": "8:40:11", "throughput": 333.09, "total_tokens": 40255552} {"current_steps": 31795, "total_steps": 40000, "loss": 0.1018, "lr": 0.030089755748880734, "epoch": 1.5535387095986124, "percentage": 79.49, "elapsed_time": "1 day, 9:34:16", "remaining_time": "8:39:48", "throughput": 333.14, "total_tokens": 40261856} {"current_steps": 31800, "total_steps": 40000, "loss": 0.0425, "lr": 0.030054375131027003, "epoch": 1.5537830112623068, "percentage": 79.5, "elapsed_time": "1 day, 9:34:19", "remaining_time": "8:39:24", "throughput": 333.18, "total_tokens": 40268416} {"current_steps": 31800, "total_steps": 40000, "eval_loss": 0.06169683486223221, "epoch": 1.5537830112623068, "percentage": 79.5, "elapsed_time": "1 day, 9:44:59", "remaining_time": "8:42:10", "throughput": 331.43, "total_tokens": 40268416} {"current_steps": 31805, "total_steps": 40000, "loss": 0.0468, "lr": 0.030019013010295942, "epoch": 1.5540273129260012, "percentage": 79.51, "elapsed_time": "1 day, 9:45:04", "remaining_time": "8:41:47", "throughput": 331.47, "total_tokens": 40275104} {"current_steps": 31810, "total_steps": 40000, "loss": 0.0591, "lr": 0.029983669392140897, "epoch": 1.5542716145896953, "percentage": 79.53, "elapsed_time": "1 day, 9:45:07", "remaining_time": "8:41:24", "throughput": 331.52, "total_tokens": 40282080} {"current_steps": 31815, "total_steps": 40000, "loss": 0.0626, "lr": 0.029948344282012217, "epoch": 1.5545159162533897, "percentage": 79.54, "elapsed_time": "1 day, 9:45:10", "remaining_time": "8:41:00", "throughput": 331.56, "total_tokens": 40288128} {"current_steps": 31820, "total_steps": 40000, "loss": 0.0587, "lr": 0.029913037685357507, "epoch": 1.5547602179170839, "percentage": 79.55, "elapsed_time": "1 day, 9:45:13", "remaining_time": "8:40:37", "throughput": 331.6, "total_tokens": 40294464} {"current_steps": 31825, "total_steps": 40000, "loss": 0.055, "lr": 0.029877749607621528, "epoch": 1.5550045195807782, "percentage": 79.56, "elapsed_time": "1 day, 9:45:16", "remaining_time": "8:40:14", "throughput": 331.65, "total_tokens": 40300832} {"current_steps": 31830, "total_steps": 40000, "loss": 0.0606, "lr": 0.029842480054246077, "epoch": 1.5552488212444726, "percentage": 79.57, "elapsed_time": "1 day, 9:45:20", "remaining_time": "8:39:51", "throughput": 331.69, "total_tokens": 40307520} {"current_steps": 31835, "total_steps": 40000, "loss": 0.0527, "lr": 0.02980722903067022, "epoch": 1.555493122908167, "percentage": 79.59, "elapsed_time": "1 day, 9:45:23", "remaining_time": "8:39:28", "throughput": 331.74, "total_tokens": 40313856} {"current_steps": 31840, "total_steps": 40000, "loss": 0.0547, "lr": 0.029771996542330113, "epoch": 1.5557374245718614, "percentage": 79.6, "elapsed_time": "1 day, 9:45:26", "remaining_time": "8:39:04", "throughput": 331.78, "total_tokens": 40320064} {"current_steps": 31845, "total_steps": 40000, "loss": 0.0716, "lr": 0.029736782594658954, "epoch": 1.5559817262355558, "percentage": 79.61, "elapsed_time": "1 day, 9:45:29", "remaining_time": "8:38:41", "throughput": 331.82, "total_tokens": 40325888} {"current_steps": 31850, "total_steps": 40000, "loss": 0.0512, "lr": 0.029701587193087284, "epoch": 1.5562260278992501, "percentage": 79.62, "elapsed_time": "1 day, 9:45:32", "remaining_time": "8:38:18", "throughput": 331.87, "total_tokens": 40332768} {"current_steps": 31855, "total_steps": 40000, "loss": 0.0289, "lr": 0.0296664103430426, "epoch": 1.5564703295629443, "percentage": 79.64, "elapsed_time": "1 day, 9:45:35", "remaining_time": "8:37:55", "throughput": 331.92, "total_tokens": 40339584} {"current_steps": 31860, "total_steps": 40000, "loss": 0.0489, "lr": 0.029631252049949652, "epoch": 1.5567146312266387, "percentage": 79.65, "elapsed_time": "1 day, 9:45:38", "remaining_time": "8:37:32", "throughput": 331.96, "total_tokens": 40345760} {"current_steps": 31865, "total_steps": 40000, "loss": 0.0698, "lr": 0.02959611231923031, "epoch": 1.5569589328903328, "percentage": 79.66, "elapsed_time": "1 day, 9:45:41", "remaining_time": "8:37:09", "throughput": 332.0, "total_tokens": 40351936} {"current_steps": 31870, "total_steps": 40000, "loss": 0.047, "lr": 0.029560991156303507, "epoch": 1.5572032345540272, "percentage": 79.67, "elapsed_time": "1 day, 9:45:44", "remaining_time": "8:36:45", "throughput": 332.04, "total_tokens": 40358176} {"current_steps": 31875, "total_steps": 40000, "loss": 0.0534, "lr": 0.02952588856658544, "epoch": 1.5574475362177216, "percentage": 79.69, "elapsed_time": "1 day, 9:45:47", "remaining_time": "8:36:22", "throughput": 332.09, "total_tokens": 40364864} {"current_steps": 31880, "total_steps": 40000, "loss": 0.0473, "lr": 0.029490804555489296, "epoch": 1.557691837881416, "percentage": 79.7, "elapsed_time": "1 day, 9:45:51", "remaining_time": "8:35:59", "throughput": 332.14, "total_tokens": 40371648} {"current_steps": 31885, "total_steps": 40000, "loss": 0.0517, "lr": 0.029455739128425484, "epoch": 1.5579361395451103, "percentage": 79.71, "elapsed_time": "1 day, 9:45:54", "remaining_time": "8:35:36", "throughput": 332.18, "total_tokens": 40377824} {"current_steps": 31890, "total_steps": 40000, "loss": 0.0516, "lr": 0.029420692290801607, "epoch": 1.5581804412088047, "percentage": 79.72, "elapsed_time": "1 day, 9:45:57", "remaining_time": "8:35:13", "throughput": 332.22, "total_tokens": 40384096} {"current_steps": 31895, "total_steps": 40000, "loss": 0.0737, "lr": 0.02938566404802223, "epoch": 1.558424742872499, "percentage": 79.74, "elapsed_time": "1 day, 9:46:00", "remaining_time": "8:34:50", "throughput": 332.27, "total_tokens": 40390368} {"current_steps": 31900, "total_steps": 40000, "loss": 0.0449, "lr": 0.029350654405489195, "epoch": 1.5586690445361933, "percentage": 79.75, "elapsed_time": "1 day, 9:46:03", "remaining_time": "8:34:27", "throughput": 332.31, "total_tokens": 40397088} {"current_steps": 31905, "total_steps": 40000, "loss": 0.0274, "lr": 0.02931566336860145, "epoch": 1.5589133461998876, "percentage": 79.76, "elapsed_time": "1 day, 9:46:06", "remaining_time": "8:34:04", "throughput": 332.36, "total_tokens": 40403616} {"current_steps": 31910, "total_steps": 40000, "loss": 0.0722, "lr": 0.02928069094275505, "epoch": 1.5591576478635818, "percentage": 79.77, "elapsed_time": "1 day, 9:46:09", "remaining_time": "8:33:41", "throughput": 332.4, "total_tokens": 40410176} {"current_steps": 31915, "total_steps": 40000, "loss": 0.0618, "lr": 0.02924573713334314, "epoch": 1.5594019495272762, "percentage": 79.79, "elapsed_time": "1 day, 9:46:12", "remaining_time": "8:33:17", "throughput": 332.45, "total_tokens": 40416608} {"current_steps": 31920, "total_steps": 40000, "loss": 0.0622, "lr": 0.02921080194575603, "epoch": 1.5596462511909706, "percentage": 79.8, "elapsed_time": "1 day, 9:46:15", "remaining_time": "8:32:54", "throughput": 332.49, "total_tokens": 40422816} {"current_steps": 31925, "total_steps": 40000, "loss": 0.062, "lr": 0.029175885385381177, "epoch": 1.559890552854665, "percentage": 79.81, "elapsed_time": "1 day, 9:46:18", "remaining_time": "8:32:31", "throughput": 332.53, "total_tokens": 40428928} {"current_steps": 31930, "total_steps": 40000, "loss": 0.0532, "lr": 0.029140987457603223, "epoch": 1.5601348545183593, "percentage": 79.83, "elapsed_time": "1 day, 9:46:21", "remaining_time": "8:32:08", "throughput": 332.58, "total_tokens": 40435328} {"current_steps": 31935, "total_steps": 40000, "loss": 0.0606, "lr": 0.029106108167803763, "epoch": 1.5603791561820537, "percentage": 79.84, "elapsed_time": "1 day, 9:46:24", "remaining_time": "8:31:45", "throughput": 332.62, "total_tokens": 40441472} {"current_steps": 31940, "total_steps": 40000, "loss": 0.0685, "lr": 0.029071247521361674, "epoch": 1.560623457845748, "percentage": 79.85, "elapsed_time": "1 day, 9:46:28", "remaining_time": "8:31:22", "throughput": 332.66, "total_tokens": 40447872} {"current_steps": 31945, "total_steps": 40000, "loss": 0.056, "lr": 0.029036405523652945, "epoch": 1.5608677595094422, "percentage": 79.86, "elapsed_time": "1 day, 9:46:31", "remaining_time": "8:30:59", "throughput": 332.71, "total_tokens": 40454048} {"current_steps": 31950, "total_steps": 40000, "loss": 0.0517, "lr": 0.029001582180050577, "epoch": 1.5611120611731366, "percentage": 79.88, "elapsed_time": "1 day, 9:46:34", "remaining_time": "8:30:36", "throughput": 332.75, "total_tokens": 40460736} {"current_steps": 31955, "total_steps": 40000, "loss": 0.0608, "lr": 0.02896677749592482, "epoch": 1.5613563628368308, "percentage": 79.89, "elapsed_time": "1 day, 9:46:37", "remaining_time": "8:30:13", "throughput": 332.79, "total_tokens": 40466752} {"current_steps": 31960, "total_steps": 40000, "loss": 0.0398, "lr": 0.028931991476642938, "epoch": 1.5616006645005251, "percentage": 79.9, "elapsed_time": "1 day, 9:46:40", "remaining_time": "8:29:50", "throughput": 332.84, "total_tokens": 40473312} {"current_steps": 31965, "total_steps": 40000, "loss": 0.0668, "lr": 0.028897224127569412, "epoch": 1.5618449661642195, "percentage": 79.91, "elapsed_time": "1 day, 9:46:43", "remaining_time": "8:29:27", "throughput": 332.88, "total_tokens": 40479744} {"current_steps": 31970, "total_steps": 40000, "loss": 0.0386, "lr": 0.028862475454065832, "epoch": 1.562089267827914, "percentage": 79.92, "elapsed_time": "1 day, 9:46:46", "remaining_time": "8:29:04", "throughput": 332.93, "total_tokens": 40486176} {"current_steps": 31975, "total_steps": 40000, "loss": 0.0689, "lr": 0.028827745461490806, "epoch": 1.5623335694916083, "percentage": 79.94, "elapsed_time": "1 day, 9:46:49", "remaining_time": "8:28:41", "throughput": 332.97, "total_tokens": 40492448} {"current_steps": 31980, "total_steps": 40000, "loss": 0.0575, "lr": 0.028793034155200212, "epoch": 1.5625778711553027, "percentage": 79.95, "elapsed_time": "1 day, 9:46:52", "remaining_time": "8:28:18", "throughput": 333.01, "total_tokens": 40498688} {"current_steps": 31985, "total_steps": 40000, "loss": 0.0621, "lr": 0.028758341540546944, "epoch": 1.562822172818997, "percentage": 79.96, "elapsed_time": "1 day, 9:46:55", "remaining_time": "8:27:55", "throughput": 333.06, "total_tokens": 40504800} {"current_steps": 31990, "total_steps": 40000, "loss": 0.0554, "lr": 0.02872366762288098, "epoch": 1.5630664744826912, "percentage": 79.97, "elapsed_time": "1 day, 9:46:58", "remaining_time": "8:27:32", "throughput": 333.1, "total_tokens": 40510880} {"current_steps": 31995, "total_steps": 40000, "loss": 0.0478, "lr": 0.028689012407549567, "epoch": 1.5633107761463856, "percentage": 79.99, "elapsed_time": "1 day, 9:47:01", "remaining_time": "8:27:09", "throughput": 333.14, "total_tokens": 40516896} {"current_steps": 32000, "total_steps": 40000, "loss": 0.0314, "lr": 0.028654375899896892, "epoch": 1.5635550778100797, "percentage": 80.0, "elapsed_time": "1 day, 9:47:04", "remaining_time": "8:26:46", "throughput": 333.18, "total_tokens": 40522848} {"current_steps": 32000, "total_steps": 40000, "eval_loss": 0.061254024505615234, "epoch": 1.5635550778100797, "percentage": 80.0, "elapsed_time": "1 day, 9:57:42", "remaining_time": "8:29:25", "throughput": 331.44, "total_tokens": 40522848} {"current_steps": 32005, "total_steps": 40000, "loss": 0.0417, "lr": 0.02861975810526437, "epoch": 1.5637993794737741, "percentage": 80.01, "elapsed_time": "1 day, 9:57:46", "remaining_time": "8:29:02", "throughput": 331.48, "total_tokens": 40529408} {"current_steps": 32010, "total_steps": 40000, "loss": 0.0871, "lr": 0.02858515902899056, "epoch": 1.5640436811374685, "percentage": 80.03, "elapsed_time": "1 day, 9:57:49", "remaining_time": "8:28:39", "throughput": 331.53, "total_tokens": 40535584} {"current_steps": 32015, "total_steps": 40000, "loss": 0.0384, "lr": 0.028550578676410976, "epoch": 1.5642879828011629, "percentage": 80.04, "elapsed_time": "1 day, 9:57:52", "remaining_time": "8:28:16", "throughput": 331.58, "total_tokens": 40542784} {"current_steps": 32020, "total_steps": 40000, "loss": 0.0412, "lr": 0.02851601705285837, "epoch": 1.5645322844648573, "percentage": 80.05, "elapsed_time": "1 day, 9:57:55", "remaining_time": "8:27:53", "throughput": 331.62, "total_tokens": 40548960} {"current_steps": 32025, "total_steps": 40000, "loss": 0.0685, "lr": 0.028481474163662666, "epoch": 1.5647765861285516, "percentage": 80.06, "elapsed_time": "1 day, 9:57:58", "remaining_time": "8:27:30", "throughput": 331.66, "total_tokens": 40554848} {"current_steps": 32030, "total_steps": 40000, "loss": 0.074, "lr": 0.028446950014150683, "epoch": 1.565020887792246, "percentage": 80.08, "elapsed_time": "1 day, 9:58:01", "remaining_time": "8:27:07", "throughput": 331.7, "total_tokens": 40561248} {"current_steps": 32035, "total_steps": 40000, "loss": 0.067, "lr": 0.028412444609646596, "epoch": 1.5652651894559402, "percentage": 80.09, "elapsed_time": "1 day, 9:58:05", "remaining_time": "8:26:44", "throughput": 331.75, "total_tokens": 40567616} {"current_steps": 32040, "total_steps": 40000, "loss": 0.0524, "lr": 0.028377957955471465, "epoch": 1.5655094911196346, "percentage": 80.1, "elapsed_time": "1 day, 9:58:08", "remaining_time": "8:26:21", "throughput": 331.79, "total_tokens": 40573664} {"current_steps": 32045, "total_steps": 40000, "loss": 0.073, "lr": 0.0283434900569436, "epoch": 1.5657537927833287, "percentage": 80.11, "elapsed_time": "1 day, 9:58:11", "remaining_time": "8:25:58", "throughput": 331.83, "total_tokens": 40579936} {"current_steps": 32050, "total_steps": 40000, "loss": 0.0516, "lr": 0.028309040919378456, "epoch": 1.565998094447023, "percentage": 80.12, "elapsed_time": "1 day, 9:58:14", "remaining_time": "8:25:35", "throughput": 331.87, "total_tokens": 40586016} {"current_steps": 32055, "total_steps": 40000, "loss": 0.0664, "lr": 0.02827461054808848, "epoch": 1.5662423961107175, "percentage": 80.14, "elapsed_time": "1 day, 9:58:17", "remaining_time": "8:25:12", "throughput": 331.91, "total_tokens": 40592192} {"current_steps": 32060, "total_steps": 40000, "loss": 0.0657, "lr": 0.028240198948383186, "epoch": 1.5664866977744119, "percentage": 80.15, "elapsed_time": "1 day, 9:58:20", "remaining_time": "8:24:48", "throughput": 331.95, "total_tokens": 40598080} {"current_steps": 32065, "total_steps": 40000, "loss": 0.0924, "lr": 0.028205806125569402, "epoch": 1.5667309994381062, "percentage": 80.16, "elapsed_time": "1 day, 9:58:23", "remaining_time": "8:24:25", "throughput": 331.99, "total_tokens": 40603776} {"current_steps": 32070, "total_steps": 40000, "loss": 0.0572, "lr": 0.028171432084950834, "epoch": 1.5669753011018006, "percentage": 80.17, "elapsed_time": "1 day, 9:58:26", "remaining_time": "8:24:02", "throughput": 332.03, "total_tokens": 40609888} {"current_steps": 32075, "total_steps": 40000, "loss": 0.0611, "lr": 0.028137076831828478, "epoch": 1.567219602765495, "percentage": 80.19, "elapsed_time": "1 day, 9:58:29", "remaining_time": "8:23:39", "throughput": 332.07, "total_tokens": 40615840} {"current_steps": 32080, "total_steps": 40000, "loss": 0.0763, "lr": 0.028102740371500238, "epoch": 1.5674639044291891, "percentage": 80.2, "elapsed_time": "1 day, 9:58:32", "remaining_time": "8:23:16", "throughput": 332.12, "total_tokens": 40622112} {"current_steps": 32085, "total_steps": 40000, "loss": 0.0468, "lr": 0.0280684227092613, "epoch": 1.5677082060928835, "percentage": 80.21, "elapsed_time": "1 day, 9:58:35", "remaining_time": "8:22:53", "throughput": 332.16, "total_tokens": 40628512} {"current_steps": 32090, "total_steps": 40000, "loss": 0.0508, "lr": 0.02803412385040392, "epoch": 1.5679525077565777, "percentage": 80.23, "elapsed_time": "1 day, 9:58:38", "remaining_time": "8:22:30", "throughput": 332.2, "total_tokens": 40634752} {"current_steps": 32095, "total_steps": 40000, "loss": 0.0272, "lr": 0.027999843800217306, "epoch": 1.568196809420272, "percentage": 80.24, "elapsed_time": "1 day, 9:58:41", "remaining_time": "8:22:07", "throughput": 332.25, "total_tokens": 40641664} {"current_steps": 32100, "total_steps": 40000, "loss": 0.0586, "lr": 0.027965582563987932, "epoch": 1.5684411110839664, "percentage": 80.25, "elapsed_time": "1 day, 9:58:44", "remaining_time": "8:21:44", "throughput": 332.29, "total_tokens": 40647808} {"current_steps": 32105, "total_steps": 40000, "loss": 0.0595, "lr": 0.027931340146999346, "epoch": 1.5686854127476608, "percentage": 80.26, "elapsed_time": "1 day, 9:58:47", "remaining_time": "8:21:21", "throughput": 332.34, "total_tokens": 40654400} {"current_steps": 32110, "total_steps": 40000, "loss": 0.0383, "lr": 0.02789711655453208, "epoch": 1.5689297144113552, "percentage": 80.27, "elapsed_time": "1 day, 9:58:51", "remaining_time": "8:20:58", "throughput": 332.39, "total_tokens": 40661344} {"current_steps": 32115, "total_steps": 40000, "loss": 0.046, "lr": 0.02786291179186392, "epoch": 1.5691740160750496, "percentage": 80.29, "elapsed_time": "1 day, 9:58:54", "remaining_time": "8:20:35", "throughput": 332.43, "total_tokens": 40667136} {"current_steps": 32120, "total_steps": 40000, "loss": 0.048, "lr": 0.02782872586426961, "epoch": 1.569418317738744, "percentage": 80.3, "elapsed_time": "1 day, 9:58:57", "remaining_time": "8:20:12", "throughput": 332.47, "total_tokens": 40673472} {"current_steps": 32125, "total_steps": 40000, "loss": 0.0497, "lr": 0.027794558777021083, "epoch": 1.5696626194024381, "percentage": 80.31, "elapsed_time": "1 day, 9:59:00", "remaining_time": "8:19:50", "throughput": 332.52, "total_tokens": 40680608} {"current_steps": 32130, "total_steps": 40000, "loss": 0.0556, "lr": 0.02776041053538734, "epoch": 1.5699069210661325, "percentage": 80.33, "elapsed_time": "1 day, 9:59:03", "remaining_time": "8:19:27", "throughput": 332.56, "total_tokens": 40686624} {"current_steps": 32135, "total_steps": 40000, "loss": 0.0954, "lr": 0.027726281144634407, "epoch": 1.5701512227298267, "percentage": 80.34, "elapsed_time": "1 day, 9:59:06", "remaining_time": "8:19:04", "throughput": 332.6, "total_tokens": 40692800} {"current_steps": 32140, "total_steps": 40000, "loss": 0.0509, "lr": 0.02769217061002552, "epoch": 1.570395524393521, "percentage": 80.35, "elapsed_time": "1 day, 9:59:09", "remaining_time": "8:18:41", "throughput": 332.65, "total_tokens": 40699296} {"current_steps": 32145, "total_steps": 40000, "loss": 0.0612, "lr": 0.027658078936820967, "epoch": 1.5706398260572154, "percentage": 80.36, "elapsed_time": "1 day, 9:59:12", "remaining_time": "8:18:18", "throughput": 332.69, "total_tokens": 40704864} {"current_steps": 32150, "total_steps": 40000, "loss": 0.0473, "lr": 0.02762400613027805, "epoch": 1.5708841277209098, "percentage": 80.38, "elapsed_time": "1 day, 9:59:15", "remaining_time": "8:17:55", "throughput": 332.73, "total_tokens": 40711456} {"current_steps": 32155, "total_steps": 40000, "loss": 0.0813, "lr": 0.027589952195651295, "epoch": 1.5711284293846042, "percentage": 80.39, "elapsed_time": "1 day, 9:59:18", "remaining_time": "8:17:32", "throughput": 332.78, "total_tokens": 40718016} {"current_steps": 32160, "total_steps": 40000, "loss": 0.0351, "lr": 0.027555917138192186, "epoch": 1.5713727310482986, "percentage": 80.4, "elapsed_time": "1 day, 9:59:21", "remaining_time": "8:17:09", "throughput": 332.82, "total_tokens": 40724224} {"current_steps": 32165, "total_steps": 40000, "loss": 0.0672, "lr": 0.027521900963149375, "epoch": 1.571617032711993, "percentage": 80.41, "elapsed_time": "1 day, 9:59:24", "remaining_time": "8:16:46", "throughput": 332.86, "total_tokens": 40730400} {"current_steps": 32170, "total_steps": 40000, "loss": 0.0478, "lr": 0.027487903675768633, "epoch": 1.571861334375687, "percentage": 80.42, "elapsed_time": "1 day, 9:59:27", "remaining_time": "8:16:23", "throughput": 332.9, "total_tokens": 40736576} {"current_steps": 32175, "total_steps": 40000, "loss": 0.0606, "lr": 0.027453925281292677, "epoch": 1.5721056360393815, "percentage": 80.44, "elapsed_time": "1 day, 9:59:31", "remaining_time": "8:16:00", "throughput": 332.95, "total_tokens": 40743136} {"current_steps": 32180, "total_steps": 40000, "loss": 0.0575, "lr": 0.027419965784961475, "epoch": 1.5723499377030756, "percentage": 80.45, "elapsed_time": "1 day, 9:59:34", "remaining_time": "8:15:37", "throughput": 332.99, "total_tokens": 40749728} {"current_steps": 32185, "total_steps": 40000, "loss": 0.0704, "lr": 0.027386025192012015, "epoch": 1.57259423936677, "percentage": 80.46, "elapsed_time": "1 day, 9:59:37", "remaining_time": "8:15:15", "throughput": 333.03, "total_tokens": 40755616} {"current_steps": 32190, "total_steps": 40000, "loss": 0.0665, "lr": 0.027352103507678277, "epoch": 1.5728385410304644, "percentage": 80.47, "elapsed_time": "1 day, 9:59:40", "remaining_time": "8:14:52", "throughput": 333.08, "total_tokens": 40762304} {"current_steps": 32195, "total_steps": 40000, "loss": 0.0503, "lr": 0.027318200737191527, "epoch": 1.5730828426941588, "percentage": 80.49, "elapsed_time": "1 day, 9:59:43", "remaining_time": "8:14:29", "throughput": 333.12, "total_tokens": 40768928} {"current_steps": 32200, "total_steps": 40000, "loss": 0.0831, "lr": 0.027284316885779935, "epoch": 1.5733271443578531, "percentage": 80.5, "elapsed_time": "1 day, 9:59:46", "remaining_time": "8:14:06", "throughput": 333.17, "total_tokens": 40775072} {"current_steps": 32200, "total_steps": 40000, "eval_loss": 0.06093883514404297, "epoch": 1.5733271443578531, "percentage": 80.5, "elapsed_time": "1 day, 10:10:24", "remaining_time": "8:16:41", "throughput": 331.44, "total_tokens": 40775072} {"current_steps": 32205, "total_steps": 40000, "loss": 0.067, "lr": 0.027250451958668785, "epoch": 1.5735714460215475, "percentage": 80.51, "elapsed_time": "1 day, 10:10:29", "remaining_time": "8:16:18", "throughput": 331.48, "total_tokens": 40781632} {"current_steps": 32210, "total_steps": 40000, "loss": 0.055, "lr": 0.027216605961080536, "epoch": 1.5738157476852417, "percentage": 80.53, "elapsed_time": "1 day, 10:10:32", "remaining_time": "8:15:55", "throughput": 331.53, "total_tokens": 40788576} {"current_steps": 32215, "total_steps": 40000, "loss": 0.0922, "lr": 0.02718277889823461, "epoch": 1.574060049348936, "percentage": 80.54, "elapsed_time": "1 day, 10:10:35", "remaining_time": "8:15:32", "throughput": 331.57, "total_tokens": 40794976} {"current_steps": 32220, "total_steps": 40000, "loss": 0.0368, "lr": 0.027148970775347604, "epoch": 1.5743043510126304, "percentage": 80.55, "elapsed_time": "1 day, 10:10:38", "remaining_time": "8:15:09", "throughput": 331.61, "total_tokens": 40801440} {"current_steps": 32225, "total_steps": 40000, "loss": 0.0802, "lr": 0.027115181597633174, "epoch": 1.5745486526763246, "percentage": 80.56, "elapsed_time": "1 day, 10:10:41", "remaining_time": "8:14:46", "throughput": 331.66, "total_tokens": 40807456} {"current_steps": 32230, "total_steps": 40000, "loss": 0.0724, "lr": 0.027081411370301976, "epoch": 1.574792954340019, "percentage": 80.58, "elapsed_time": "1 day, 10:10:44", "remaining_time": "8:14:23", "throughput": 331.69, "total_tokens": 40813280} {"current_steps": 32235, "total_steps": 40000, "loss": 0.0801, "lr": 0.027047660098561875, "epoch": 1.5750372560037134, "percentage": 80.59, "elapsed_time": "1 day, 10:10:47", "remaining_time": "8:14:00", "throughput": 331.74, "total_tokens": 40819584} {"current_steps": 32240, "total_steps": 40000, "loss": 0.0449, "lr": 0.02701392778761766, "epoch": 1.5752815576674077, "percentage": 80.6, "elapsed_time": "1 day, 10:10:51", "remaining_time": "8:13:37", "throughput": 331.78, "total_tokens": 40826080} {"current_steps": 32245, "total_steps": 40000, "loss": 0.0834, "lr": 0.02698021444267133, "epoch": 1.5755258593311021, "percentage": 80.61, "elapsed_time": "1 day, 10:10:54", "remaining_time": "8:13:14", "throughput": 331.83, "total_tokens": 40832576} {"current_steps": 32250, "total_steps": 40000, "loss": 0.0403, "lr": 0.026946520068921915, "epoch": 1.5757701609947965, "percentage": 80.62, "elapsed_time": "1 day, 10:10:57", "remaining_time": "8:12:51", "throughput": 331.87, "total_tokens": 40839072} {"current_steps": 32255, "total_steps": 40000, "loss": 0.0773, "lr": 0.02691284467156547, "epoch": 1.5760144626584907, "percentage": 80.64, "elapsed_time": "1 day, 10:11:00", "remaining_time": "8:12:29", "throughput": 331.92, "total_tokens": 40845728} {"current_steps": 32260, "total_steps": 40000, "loss": 0.093, "lr": 0.026879188255795182, "epoch": 1.576258764322185, "percentage": 80.65, "elapsed_time": "1 day, 10:11:03", "remaining_time": "8:12:06", "throughput": 331.96, "total_tokens": 40852256} {"current_steps": 32265, "total_steps": 40000, "loss": 0.0467, "lr": 0.026845550826801328, "epoch": 1.5765030659858794, "percentage": 80.66, "elapsed_time": "1 day, 10:11:06", "remaining_time": "8:11:43", "throughput": 332.0, "total_tokens": 40858528} {"current_steps": 32270, "total_steps": 40000, "loss": 0.0638, "lr": 0.02681193238977121, "epoch": 1.5767473676495736, "percentage": 80.67, "elapsed_time": "1 day, 10:11:09", "remaining_time": "8:11:20", "throughput": 332.05, "total_tokens": 40864736} {"current_steps": 32275, "total_steps": 40000, "loss": 0.0465, "lr": 0.026778332949889145, "epoch": 1.576991669313268, "percentage": 80.69, "elapsed_time": "1 day, 10:11:12", "remaining_time": "8:10:57", "throughput": 332.09, "total_tokens": 40871520} {"current_steps": 32280, "total_steps": 40000, "loss": 0.09, "lr": 0.026744752512336673, "epoch": 1.5772359709769623, "percentage": 80.7, "elapsed_time": "1 day, 10:11:15", "remaining_time": "8:10:34", "throughput": 332.14, "total_tokens": 40877920} {"current_steps": 32285, "total_steps": 40000, "loss": 0.05, "lr": 0.02671119108229225, "epoch": 1.5774802726406567, "percentage": 80.71, "elapsed_time": "1 day, 10:11:18", "remaining_time": "8:10:11", "throughput": 332.18, "total_tokens": 40883808} {"current_steps": 32290, "total_steps": 40000, "loss": 0.0349, "lr": 0.026677648664931556, "epoch": 1.577724574304351, "percentage": 80.73, "elapsed_time": "1 day, 10:11:21", "remaining_time": "8:09:48", "throughput": 332.22, "total_tokens": 40890176} {"current_steps": 32295, "total_steps": 40000, "loss": 0.0508, "lr": 0.026644125265427154, "epoch": 1.5779688759680455, "percentage": 80.74, "elapsed_time": "1 day, 10:11:25", "remaining_time": "8:09:25", "throughput": 332.26, "total_tokens": 40896256} {"current_steps": 32300, "total_steps": 40000, "loss": 0.0473, "lr": 0.026610620888948822, "epoch": 1.5782131776317396, "percentage": 80.75, "elapsed_time": "1 day, 10:11:28", "remaining_time": "8:09:03", "throughput": 332.31, "total_tokens": 40903296} {"current_steps": 32305, "total_steps": 40000, "loss": 0.0486, "lr": 0.026577135540663408, "epoch": 1.578457479295434, "percentage": 80.76, "elapsed_time": "1 day, 10:11:31", "remaining_time": "8:08:40", "throughput": 332.35, "total_tokens": 40909696} {"current_steps": 32310, "total_steps": 40000, "loss": 0.0467, "lr": 0.026543669225734673, "epoch": 1.5787017809591284, "percentage": 80.77, "elapsed_time": "1 day, 10:11:34", "remaining_time": "8:08:17", "throughput": 332.4, "total_tokens": 40916864} {"current_steps": 32315, "total_steps": 40000, "loss": 0.0594, "lr": 0.02651022194932363, "epoch": 1.5789460826228225, "percentage": 80.79, "elapsed_time": "1 day, 10:11:37", "remaining_time": "8:07:54", "throughput": 332.45, "total_tokens": 40923456} {"current_steps": 32320, "total_steps": 40000, "loss": 0.075, "lr": 0.026476793716588194, "epoch": 1.579190384286517, "percentage": 80.8, "elapsed_time": "1 day, 10:11:40", "remaining_time": "8:07:31", "throughput": 332.5, "total_tokens": 40930560} {"current_steps": 32325, "total_steps": 40000, "loss": 0.0353, "lr": 0.026443384532683467, "epoch": 1.5794346859502113, "percentage": 80.81, "elapsed_time": "1 day, 10:11:43", "remaining_time": "8:07:08", "throughput": 332.54, "total_tokens": 40937216} {"current_steps": 32330, "total_steps": 40000, "loss": 0.0455, "lr": 0.026409994402761584, "epoch": 1.5796789876139057, "percentage": 80.83, "elapsed_time": "1 day, 10:11:47", "remaining_time": "8:06:46", "throughput": 332.59, "total_tokens": 40943936} {"current_steps": 32335, "total_steps": 40000, "loss": 0.059, "lr": 0.026376623331971653, "epoch": 1.5799232892776, "percentage": 80.84, "elapsed_time": "1 day, 10:11:50", "remaining_time": "8:06:23", "throughput": 332.63, "total_tokens": 40950080} {"current_steps": 32340, "total_steps": 40000, "loss": 0.0465, "lr": 0.026343271325459997, "epoch": 1.5801675909412944, "percentage": 80.85, "elapsed_time": "1 day, 10:11:53", "remaining_time": "8:06:00", "throughput": 332.67, "total_tokens": 40956128} {"current_steps": 32345, "total_steps": 40000, "loss": 0.0375, "lr": 0.02630993838836987, "epoch": 1.5804118926049886, "percentage": 80.86, "elapsed_time": "1 day, 10:11:56", "remaining_time": "8:05:37", "throughput": 332.71, "total_tokens": 40962592} {"current_steps": 32350, "total_steps": 40000, "loss": 0.0503, "lr": 0.026276624525841584, "epoch": 1.580656194268683, "percentage": 80.88, "elapsed_time": "1 day, 10:11:59", "remaining_time": "8:05:14", "throughput": 332.76, "total_tokens": 40969184} {"current_steps": 32355, "total_steps": 40000, "loss": 0.0532, "lr": 0.026243329743012637, "epoch": 1.5809004959323771, "percentage": 80.89, "elapsed_time": "1 day, 10:12:02", "remaining_time": "8:04:51", "throughput": 332.81, "total_tokens": 40976000} {"current_steps": 32360, "total_steps": 40000, "loss": 0.0436, "lr": 0.026210054045017438, "epoch": 1.5811447975960715, "percentage": 80.9, "elapsed_time": "1 day, 10:12:05", "remaining_time": "8:04:29", "throughput": 332.85, "total_tokens": 40982336} {"current_steps": 32365, "total_steps": 40000, "loss": 0.0567, "lr": 0.02617679743698755, "epoch": 1.581389099259766, "percentage": 80.91, "elapsed_time": "1 day, 10:12:08", "remaining_time": "8:04:06", "throughput": 332.89, "total_tokens": 40988384} {"current_steps": 32370, "total_steps": 40000, "loss": 0.0703, "lr": 0.02614355992405158, "epoch": 1.5816334009234603, "percentage": 80.92, "elapsed_time": "1 day, 10:12:11", "remaining_time": "8:03:43", "throughput": 332.93, "total_tokens": 40994144} {"current_steps": 32375, "total_steps": 40000, "loss": 0.0504, "lr": 0.026110341511335115, "epoch": 1.5818777025871547, "percentage": 80.94, "elapsed_time": "1 day, 10:12:14", "remaining_time": "8:03:20", "throughput": 332.97, "total_tokens": 41000736} {"current_steps": 32380, "total_steps": 40000, "loss": 0.0292, "lr": 0.02607714220396093, "epoch": 1.582122004250849, "percentage": 80.95, "elapsed_time": "1 day, 10:12:17", "remaining_time": "8:02:58", "throughput": 333.01, "total_tokens": 41006528} {"current_steps": 32385, "total_steps": 40000, "loss": 0.0301, "lr": 0.02604396200704869, "epoch": 1.5823663059145434, "percentage": 80.96, "elapsed_time": "1 day, 10:12:20", "remaining_time": "8:02:35", "throughput": 333.06, "total_tokens": 41012960} {"current_steps": 32390, "total_steps": 40000, "loss": 0.053, "lr": 0.02601080092571523, "epoch": 1.5826106075782376, "percentage": 80.97, "elapsed_time": "1 day, 10:12:23", "remaining_time": "8:02:12", "throughput": 333.1, "total_tokens": 41018784} {"current_steps": 32395, "total_steps": 40000, "loss": 0.0619, "lr": 0.025977658965074455, "epoch": 1.582854909241932, "percentage": 80.99, "elapsed_time": "1 day, 10:12:26", "remaining_time": "8:01:49", "throughput": 333.14, "total_tokens": 41025056} {"current_steps": 32400, "total_steps": 40000, "loss": 0.0628, "lr": 0.02594453613023719, "epoch": 1.583099210905626, "percentage": 81.0, "elapsed_time": "1 day, 10:12:29", "remaining_time": "8:01:26", "throughput": 333.18, "total_tokens": 41031296} {"current_steps": 32400, "total_steps": 40000, "eval_loss": 0.061447326093912125, "epoch": 1.583099210905626, "percentage": 81.0, "elapsed_time": "1 day, 10:23:04", "remaining_time": "8:03:55", "throughput": 331.47, "total_tokens": 41031296} {"current_steps": 32405, "total_steps": 40000, "loss": 0.0655, "lr": 0.025911432426311443, "epoch": 1.5833435125693205, "percentage": 81.01, "elapsed_time": "1 day, 10:23:08", "remaining_time": "8:03:33", "throughput": 331.51, "total_tokens": 41037184} {"current_steps": 32410, "total_steps": 40000, "loss": 0.0546, "lr": 0.025878347858402234, "epoch": 1.5835878142330149, "percentage": 81.03, "elapsed_time": "1 day, 10:23:11", "remaining_time": "8:03:10", "throughput": 331.55, "total_tokens": 41043424} {"current_steps": 32415, "total_steps": 40000, "loss": 0.0707, "lr": 0.025845282431611598, "epoch": 1.5838321158967092, "percentage": 81.04, "elapsed_time": "1 day, 10:23:14", "remaining_time": "8:02:47", "throughput": 331.6, "total_tokens": 41049824} {"current_steps": 32420, "total_steps": 40000, "loss": 0.0485, "lr": 0.025812236151038608, "epoch": 1.5840764175604036, "percentage": 81.05, "elapsed_time": "1 day, 10:23:17", "remaining_time": "8:02:24", "throughput": 331.64, "total_tokens": 41056064} {"current_steps": 32425, "total_steps": 40000, "loss": 0.0351, "lr": 0.025779209021779468, "epoch": 1.584320719224098, "percentage": 81.06, "elapsed_time": "1 day, 10:23:20", "remaining_time": "8:02:01", "throughput": 331.68, "total_tokens": 41062208} {"current_steps": 32430, "total_steps": 40000, "loss": 0.0506, "lr": 0.025746201048927324, "epoch": 1.5845650208877924, "percentage": 81.08, "elapsed_time": "1 day, 10:23:23", "remaining_time": "8:01:39", "throughput": 331.72, "total_tokens": 41068320} {"current_steps": 32435, "total_steps": 40000, "loss": 0.0385, "lr": 0.025713212237572485, "epoch": 1.5848093225514865, "percentage": 81.09, "elapsed_time": "1 day, 10:23:26", "remaining_time": "8:01:16", "throughput": 331.76, "total_tokens": 41074688} {"current_steps": 32440, "total_steps": 40000, "loss": 0.0682, "lr": 0.025680242592802164, "epoch": 1.585053624215181, "percentage": 81.1, "elapsed_time": "1 day, 10:23:30", "remaining_time": "8:00:53", "throughput": 331.81, "total_tokens": 41081088} {"current_steps": 32445, "total_steps": 40000, "loss": 0.053, "lr": 0.02564729211970073, "epoch": 1.585297925878875, "percentage": 81.11, "elapsed_time": "1 day, 10:23:33", "remaining_time": "8:00:30", "throughput": 331.85, "total_tokens": 41087456} {"current_steps": 32450, "total_steps": 40000, "loss": 0.0558, "lr": 0.025614360823349617, "epoch": 1.5855422275425695, "percentage": 81.12, "elapsed_time": "1 day, 10:23:36", "remaining_time": "8:00:07", "throughput": 331.89, "total_tokens": 41093920} {"current_steps": 32455, "total_steps": 40000, "loss": 0.059, "lr": 0.025581448708827146, "epoch": 1.5857865292062638, "percentage": 81.14, "elapsed_time": "1 day, 10:23:39", "remaining_time": "7:59:45", "throughput": 331.94, "total_tokens": 41100128} {"current_steps": 32460, "total_steps": 40000, "loss": 0.0399, "lr": 0.025548555781208876, "epoch": 1.5860308308699582, "percentage": 81.15, "elapsed_time": "1 day, 10:23:42", "remaining_time": "7:59:22", "throughput": 331.98, "total_tokens": 41106784} {"current_steps": 32465, "total_steps": 40000, "loss": 0.0512, "lr": 0.02551568204556721, "epoch": 1.5862751325336526, "percentage": 81.16, "elapsed_time": "1 day, 10:23:45", "remaining_time": "7:58:59", "throughput": 332.02, "total_tokens": 41113088} {"current_steps": 32470, "total_steps": 40000, "loss": 0.0469, "lr": 0.02548282750697173, "epoch": 1.586519434197347, "percentage": 81.17, "elapsed_time": "1 day, 10:23:48", "remaining_time": "7:58:36", "throughput": 332.07, "total_tokens": 41119584} {"current_steps": 32475, "total_steps": 40000, "loss": 0.0674, "lr": 0.02544999217048909, "epoch": 1.5867637358610414, "percentage": 81.19, "elapsed_time": "1 day, 10:23:51", "remaining_time": "7:58:13", "throughput": 332.11, "total_tokens": 41126144} {"current_steps": 32480, "total_steps": 40000, "loss": 0.0626, "lr": 0.025417176041182793, "epoch": 1.5870080375247355, "percentage": 81.2, "elapsed_time": "1 day, 10:23:54", "remaining_time": "7:57:51", "throughput": 332.15, "total_tokens": 41131840} {"current_steps": 32485, "total_steps": 40000, "loss": 0.0403, "lr": 0.025384379124113596, "epoch": 1.58725233918843, "percentage": 81.21, "elapsed_time": "1 day, 10:23:57", "remaining_time": "7:57:28", "throughput": 332.19, "total_tokens": 41137792} {"current_steps": 32490, "total_steps": 40000, "loss": 0.0558, "lr": 0.025351601424339124, "epoch": 1.587496640852124, "percentage": 81.23, "elapsed_time": "1 day, 10:24:00", "remaining_time": "7:57:05", "throughput": 332.24, "total_tokens": 41144640} {"current_steps": 32495, "total_steps": 40000, "loss": 0.0494, "lr": 0.025318842946914184, "epoch": 1.5877409425158184, "percentage": 81.24, "elapsed_time": "1 day, 10:24:04", "remaining_time": "7:56:42", "throughput": 332.28, "total_tokens": 41151232} {"current_steps": 32500, "total_steps": 40000, "loss": 0.0466, "lr": 0.025286103696890494, "epoch": 1.5879852441795128, "percentage": 81.25, "elapsed_time": "1 day, 10:24:07", "remaining_time": "7:56:20", "throughput": 332.33, "total_tokens": 41157504} {"current_steps": 32505, "total_steps": 40000, "loss": 0.0668, "lr": 0.025253383679316836, "epoch": 1.5882295458432072, "percentage": 81.26, "elapsed_time": "1 day, 10:24:10", "remaining_time": "7:55:57", "throughput": 332.37, "total_tokens": 41164160} {"current_steps": 32510, "total_steps": 40000, "loss": 0.0438, "lr": 0.025220682899239077, "epoch": 1.5884738475069016, "percentage": 81.27, "elapsed_time": "1 day, 10:24:13", "remaining_time": "7:55:34", "throughput": 332.41, "total_tokens": 41170048} {"current_steps": 32515, "total_steps": 40000, "loss": 0.0746, "lr": 0.02518800136170013, "epoch": 1.588718149170596, "percentage": 81.29, "elapsed_time": "1 day, 10:24:16", "remaining_time": "7:55:11", "throughput": 332.45, "total_tokens": 41176288} {"current_steps": 32520, "total_steps": 40000, "loss": 0.0695, "lr": 0.02515533907173981, "epoch": 1.5889624508342903, "percentage": 81.3, "elapsed_time": "1 day, 10:24:19", "remaining_time": "7:54:49", "throughput": 332.5, "total_tokens": 41183136} {"current_steps": 32525, "total_steps": 40000, "loss": 0.0539, "lr": 0.025122696034395115, "epoch": 1.5892067524979845, "percentage": 81.31, "elapsed_time": "1 day, 10:24:22", "remaining_time": "7:54:26", "throughput": 332.54, "total_tokens": 41189120} {"current_steps": 32530, "total_steps": 40000, "loss": 0.0487, "lr": 0.025090072254700023, "epoch": 1.5894510541616789, "percentage": 81.33, "elapsed_time": "1 day, 10:24:25", "remaining_time": "7:54:03", "throughput": 332.59, "total_tokens": 41195840} {"current_steps": 32535, "total_steps": 40000, "loss": 0.0787, "lr": 0.025057467737685468, "epoch": 1.589695355825373, "percentage": 81.34, "elapsed_time": "1 day, 10:24:28", "remaining_time": "7:53:41", "throughput": 332.63, "total_tokens": 41201920} {"current_steps": 32540, "total_steps": 40000, "loss": 0.047, "lr": 0.025024882488379557, "epoch": 1.5899396574890674, "percentage": 81.35, "elapsed_time": "1 day, 10:24:31", "remaining_time": "7:53:18", "throughput": 332.67, "total_tokens": 41208608} {"current_steps": 32545, "total_steps": 40000, "loss": 0.067, "lr": 0.02499231651180727, "epoch": 1.5901839591527618, "percentage": 81.36, "elapsed_time": "1 day, 10:24:34", "remaining_time": "7:52:55", "throughput": 332.72, "total_tokens": 41215424} {"current_steps": 32550, "total_steps": 40000, "loss": 0.043, "lr": 0.024959769812990713, "epoch": 1.5904282608164562, "percentage": 81.38, "elapsed_time": "1 day, 10:24:37", "remaining_time": "7:52:32", "throughput": 332.76, "total_tokens": 41221600} {"current_steps": 32555, "total_steps": 40000, "loss": 0.0611, "lr": 0.024927242396949045, "epoch": 1.5906725624801505, "percentage": 81.39, "elapsed_time": "1 day, 10:24:40", "remaining_time": "7:52:10", "throughput": 332.8, "total_tokens": 41227680} {"current_steps": 32560, "total_steps": 40000, "loss": 0.0651, "lr": 0.02489473426869836, "epoch": 1.590916864143845, "percentage": 81.4, "elapsed_time": "1 day, 10:24:44", "remaining_time": "7:51:47", "throughput": 332.85, "total_tokens": 41234304} {"current_steps": 32565, "total_steps": 40000, "loss": 0.0746, "lr": 0.024862245433251776, "epoch": 1.5911611658075393, "percentage": 81.41, "elapsed_time": "1 day, 10:24:47", "remaining_time": "7:51:25", "throughput": 332.89, "total_tokens": 41240960} {"current_steps": 32570, "total_steps": 40000, "loss": 0.0338, "lr": 0.024829775895619577, "epoch": 1.5914054674712335, "percentage": 81.42, "elapsed_time": "1 day, 10:24:50", "remaining_time": "7:51:02", "throughput": 332.94, "total_tokens": 41247744} {"current_steps": 32575, "total_steps": 40000, "loss": 0.0522, "lr": 0.024797325660808882, "epoch": 1.5916497691349278, "percentage": 81.44, "elapsed_time": "1 day, 10:24:53", "remaining_time": "7:50:39", "throughput": 332.98, "total_tokens": 41254560} {"current_steps": 32580, "total_steps": 40000, "loss": 0.0816, "lr": 0.02476489473382401, "epoch": 1.591894070798622, "percentage": 81.45, "elapsed_time": "1 day, 10:24:56", "remaining_time": "7:50:17", "throughput": 333.03, "total_tokens": 41261120} {"current_steps": 32585, "total_steps": 40000, "loss": 0.0504, "lr": 0.024732483119666127, "epoch": 1.5921383724623164, "percentage": 81.46, "elapsed_time": "1 day, 10:24:59", "remaining_time": "7:49:54", "throughput": 333.07, "total_tokens": 41267904} {"current_steps": 32590, "total_steps": 40000, "loss": 0.0381, "lr": 0.024700090823333548, "epoch": 1.5923826741260108, "percentage": 81.47, "elapsed_time": "1 day, 10:25:02", "remaining_time": "7:49:31", "throughput": 333.12, "total_tokens": 41274720} {"current_steps": 32595, "total_steps": 40000, "loss": 0.0749, "lr": 0.02466771784982163, "epoch": 1.5926269757897051, "percentage": 81.49, "elapsed_time": "1 day, 10:25:06", "remaining_time": "7:49:09", "throughput": 333.16, "total_tokens": 41280928} {"current_steps": 32600, "total_steps": 40000, "loss": 0.0856, "lr": 0.024635364204122594, "epoch": 1.5928712774533995, "percentage": 81.5, "elapsed_time": "1 day, 10:25:09", "remaining_time": "7:48:46", "throughput": 333.21, "total_tokens": 41287200} {"current_steps": 32600, "total_steps": 40000, "eval_loss": 0.061915721744298935, "epoch": 1.5928712774533995, "percentage": 81.5, "elapsed_time": "1 day, 10:35:42", "remaining_time": "7:51:10", "throughput": 331.51, "total_tokens": 41287200} {"current_steps": 32605, "total_steps": 40000, "loss": 0.0527, "lr": 0.024603029891225852, "epoch": 1.593115579117094, "percentage": 81.51, "elapsed_time": "1 day, 10:35:49", "remaining_time": "7:50:48", "throughput": 331.54, "total_tokens": 41293472} {"current_steps": 32610, "total_steps": 40000, "loss": 0.0681, "lr": 0.024570714916117748, "epoch": 1.5933598807807883, "percentage": 81.53, "elapsed_time": "1 day, 10:35:52", "remaining_time": "7:50:25", "throughput": 331.58, "total_tokens": 41299552} {"current_steps": 32615, "total_steps": 40000, "loss": 0.0617, "lr": 0.024538419283781625, "epoch": 1.5936041824444824, "percentage": 81.54, "elapsed_time": "1 day, 10:35:55", "remaining_time": "7:50:03", "throughput": 331.63, "total_tokens": 41305952} {"current_steps": 32620, "total_steps": 40000, "loss": 0.0614, "lr": 0.024506142999197938, "epoch": 1.5938484841081768, "percentage": 81.55, "elapsed_time": "1 day, 10:35:58", "remaining_time": "7:49:40", "throughput": 331.67, "total_tokens": 41312224} {"current_steps": 32625, "total_steps": 40000, "loss": 0.0561, "lr": 0.024473886067344002, "epoch": 1.594092785771871, "percentage": 81.56, "elapsed_time": "1 day, 10:36:01", "remaining_time": "7:49:17", "throughput": 331.71, "total_tokens": 41318176} {"current_steps": 32630, "total_steps": 40000, "loss": 0.066, "lr": 0.02444164849319434, "epoch": 1.5943370874355653, "percentage": 81.58, "elapsed_time": "1 day, 10:36:04", "remaining_time": "7:48:54", "throughput": 331.75, "total_tokens": 41324864} {"current_steps": 32635, "total_steps": 40000, "loss": 0.0216, "lr": 0.024409430281720306, "epoch": 1.5945813890992597, "percentage": 81.59, "elapsed_time": "1 day, 10:36:08", "remaining_time": "7:48:32", "throughput": 331.8, "total_tokens": 41331744} {"current_steps": 32640, "total_steps": 40000, "loss": 0.0362, "lr": 0.024377231437890428, "epoch": 1.594825690762954, "percentage": 81.6, "elapsed_time": "1 day, 10:36:11", "remaining_time": "7:48:09", "throughput": 331.84, "total_tokens": 41337984} {"current_steps": 32645, "total_steps": 40000, "loss": 0.0354, "lr": 0.024345051966670115, "epoch": 1.5950699924266485, "percentage": 81.61, "elapsed_time": "1 day, 10:36:14", "remaining_time": "7:47:46", "throughput": 331.88, "total_tokens": 41344192} {"current_steps": 32650, "total_steps": 40000, "loss": 0.0625, "lr": 0.024312891873021884, "epoch": 1.5953142940903429, "percentage": 81.62, "elapsed_time": "1 day, 10:36:17", "remaining_time": "7:47:24", "throughput": 331.92, "total_tokens": 41350112} {"current_steps": 32655, "total_steps": 40000, "loss": 0.0543, "lr": 0.024280751161905183, "epoch": 1.5955585957540372, "percentage": 81.64, "elapsed_time": "1 day, 10:36:20", "remaining_time": "7:47:01", "throughput": 331.97, "total_tokens": 41356320} {"current_steps": 32660, "total_steps": 40000, "loss": 0.0836, "lr": 0.02424862983827658, "epoch": 1.5958028974177314, "percentage": 81.65, "elapsed_time": "1 day, 10:36:23", "remaining_time": "7:46:38", "throughput": 332.01, "total_tokens": 41362816} {"current_steps": 32665, "total_steps": 40000, "loss": 0.0661, "lr": 0.024216527907089495, "epoch": 1.5960471990814258, "percentage": 81.66, "elapsed_time": "1 day, 10:36:26", "remaining_time": "7:46:16", "throughput": 332.05, "total_tokens": 41369088} {"current_steps": 32670, "total_steps": 40000, "loss": 0.0348, "lr": 0.024184445373294505, "epoch": 1.59629150074512, "percentage": 81.67, "elapsed_time": "1 day, 10:36:29", "remaining_time": "7:45:53", "throughput": 332.09, "total_tokens": 41375264} {"current_steps": 32675, "total_steps": 40000, "loss": 0.051, "lr": 0.02415238224183918, "epoch": 1.5965358024088143, "percentage": 81.69, "elapsed_time": "1 day, 10:36:32", "remaining_time": "7:45:30", "throughput": 332.13, "total_tokens": 41380768} {"current_steps": 32680, "total_steps": 40000, "loss": 0.0454, "lr": 0.024120338517667973, "epoch": 1.5967801040725087, "percentage": 81.7, "elapsed_time": "1 day, 10:36:35", "remaining_time": "7:45:08", "throughput": 332.17, "total_tokens": 41387296} {"current_steps": 32685, "total_steps": 40000, "loss": 0.0635, "lr": 0.02408831420572247, "epoch": 1.597024405736203, "percentage": 81.71, "elapsed_time": "1 day, 10:36:38", "remaining_time": "7:44:45", "throughput": 332.22, "total_tokens": 41393856} {"current_steps": 32690, "total_steps": 40000, "loss": 0.0607, "lr": 0.024056309310941264, "epoch": 1.5972687073998975, "percentage": 81.73, "elapsed_time": "1 day, 10:36:41", "remaining_time": "7:44:22", "throughput": 332.26, "total_tokens": 41400320} {"current_steps": 32695, "total_steps": 40000, "loss": 0.0573, "lr": 0.02402432383825982, "epoch": 1.5975130090635918, "percentage": 81.74, "elapsed_time": "1 day, 10:36:44", "remaining_time": "7:44:00", "throughput": 332.3, "total_tokens": 41406656} {"current_steps": 32700, "total_steps": 40000, "loss": 0.0574, "lr": 0.023992357792610792, "epoch": 1.5977573107272862, "percentage": 81.75, "elapsed_time": "1 day, 10:36:48", "remaining_time": "7:43:37", "throughput": 332.35, "total_tokens": 41413152} {"current_steps": 32705, "total_steps": 40000, "loss": 0.0687, "lr": 0.0239604111789237, "epoch": 1.5980016123909804, "percentage": 81.76, "elapsed_time": "1 day, 10:36:51", "remaining_time": "7:43:15", "throughput": 332.39, "total_tokens": 41419488} {"current_steps": 32710, "total_steps": 40000, "loss": 0.045, "lr": 0.023928484002125095, "epoch": 1.5982459140546748, "percentage": 81.77, "elapsed_time": "1 day, 10:36:54", "remaining_time": "7:42:52", "throughput": 332.43, "total_tokens": 41426048} {"current_steps": 32715, "total_steps": 40000, "loss": 0.0447, "lr": 0.023896576267138595, "epoch": 1.598490215718369, "percentage": 81.79, "elapsed_time": "1 day, 10:36:57", "remaining_time": "7:42:29", "throughput": 332.47, "total_tokens": 41432032} {"current_steps": 32720, "total_steps": 40000, "loss": 0.0663, "lr": 0.02386468797888471, "epoch": 1.5987345173820633, "percentage": 81.8, "elapsed_time": "1 day, 10:37:00", "remaining_time": "7:42:07", "throughput": 332.51, "total_tokens": 41437824} {"current_steps": 32725, "total_steps": 40000, "loss": 0.063, "lr": 0.023832819142281057, "epoch": 1.5989788190457577, "percentage": 81.81, "elapsed_time": "1 day, 10:37:03", "remaining_time": "7:41:44", "throughput": 332.55, "total_tokens": 41443840} {"current_steps": 32730, "total_steps": 40000, "loss": 0.0363, "lr": 0.02380096976224225, "epoch": 1.599223120709452, "percentage": 81.83, "elapsed_time": "1 day, 10:37:06", "remaining_time": "7:41:22", "throughput": 332.6, "total_tokens": 41450464} {"current_steps": 32735, "total_steps": 40000, "loss": 0.0419, "lr": 0.023769139843679777, "epoch": 1.5994674223731464, "percentage": 81.84, "elapsed_time": "1 day, 10:37:09", "remaining_time": "7:40:59", "throughput": 332.64, "total_tokens": 41456960} {"current_steps": 32740, "total_steps": 40000, "loss": 0.0216, "lr": 0.023737329391502287, "epoch": 1.5997117240368408, "percentage": 81.85, "elapsed_time": "1 day, 10:37:12", "remaining_time": "7:40:36", "throughput": 332.69, "total_tokens": 41463424} {"current_steps": 32745, "total_steps": 40000, "loss": 0.0807, "lr": 0.023705538410615293, "epoch": 1.599956025700535, "percentage": 81.86, "elapsed_time": "1 day, 10:37:15", "remaining_time": "7:40:14", "throughput": 332.73, "total_tokens": 41470208} {"current_steps": 32750, "total_steps": 40000, "loss": 0.0242, "lr": 0.023673766905921396, "epoch": 1.6002003273642293, "percentage": 81.88, "elapsed_time": "1 day, 10:37:18", "remaining_time": "7:39:51", "throughput": 332.77, "total_tokens": 41476640} {"current_steps": 32755, "total_steps": 40000, "loss": 0.0821, "lr": 0.0236420148823202, "epoch": 1.6004446290279237, "percentage": 81.89, "elapsed_time": "1 day, 10:37:21", "remaining_time": "7:39:29", "throughput": 332.82, "total_tokens": 41483264} {"current_steps": 32760, "total_steps": 40000, "loss": 0.1028, "lr": 0.02361028234470816, "epoch": 1.6006889306916179, "percentage": 81.9, "elapsed_time": "1 day, 10:37:24", "remaining_time": "7:39:06", "throughput": 332.86, "total_tokens": 41489504} {"current_steps": 32765, "total_steps": 40000, "loss": 0.0716, "lr": 0.023578569297978913, "epoch": 1.6009332323553123, "percentage": 81.91, "elapsed_time": "1 day, 10:37:27", "remaining_time": "7:38:44", "throughput": 332.9, "total_tokens": 41495648} {"current_steps": 32770, "total_steps": 40000, "loss": 0.0869, "lr": 0.023546875747023025, "epoch": 1.6011775340190066, "percentage": 81.92, "elapsed_time": "1 day, 10:37:31", "remaining_time": "7:38:21", "throughput": 332.95, "total_tokens": 41502304} {"current_steps": 32775, "total_steps": 40000, "loss": 0.0483, "lr": 0.02351520169672801, "epoch": 1.601421835682701, "percentage": 81.94, "elapsed_time": "1 day, 10:37:34", "remaining_time": "7:37:59", "throughput": 332.99, "total_tokens": 41508608} {"current_steps": 32780, "total_steps": 40000, "loss": 0.0311, "lr": 0.023483547151978357, "epoch": 1.6016661373463954, "percentage": 81.95, "elapsed_time": "1 day, 10:37:37", "remaining_time": "7:37:36", "throughput": 333.03, "total_tokens": 41514848} {"current_steps": 32785, "total_steps": 40000, "loss": 0.0405, "lr": 0.023451912117655675, "epoch": 1.6019104390100898, "percentage": 81.96, "elapsed_time": "1 day, 10:37:40", "remaining_time": "7:37:13", "throughput": 333.08, "total_tokens": 41521280} {"current_steps": 32790, "total_steps": 40000, "loss": 0.0403, "lr": 0.023420296598638417, "epoch": 1.602154740673784, "percentage": 81.97, "elapsed_time": "1 day, 10:37:43", "remaining_time": "7:36:51", "throughput": 333.12, "total_tokens": 41528480} {"current_steps": 32795, "total_steps": 40000, "loss": 0.0592, "lr": 0.023388700599802165, "epoch": 1.6023990423374783, "percentage": 81.99, "elapsed_time": "1 day, 10:37:46", "remaining_time": "7:36:29", "throughput": 333.17, "total_tokens": 41535072} {"current_steps": 32800, "total_steps": 40000, "loss": 0.0431, "lr": 0.023357124126019334, "epoch": 1.6026433440011727, "percentage": 82.0, "elapsed_time": "1 day, 10:37:49", "remaining_time": "7:36:06", "throughput": 333.21, "total_tokens": 41541664} {"current_steps": 32800, "total_steps": 40000, "eval_loss": 0.06186993792653084, "epoch": 1.6026433440011727, "percentage": 82.0, "elapsed_time": "1 day, 10:48:23", "remaining_time": "7:38:25", "throughput": 331.53, "total_tokens": 41541664} {"current_steps": 32805, "total_steps": 40000, "loss": 0.0761, "lr": 0.02332556718215945, "epoch": 1.6028876456648669, "percentage": 82.01, "elapsed_time": "1 day, 10:48:27", "remaining_time": "7:38:03", "throughput": 331.57, "total_tokens": 41547808} {"current_steps": 32810, "total_steps": 40000, "loss": 0.0508, "lr": 0.023294029773089035, "epoch": 1.6031319473285612, "percentage": 82.03, "elapsed_time": "1 day, 10:48:30", "remaining_time": "7:37:40", "throughput": 331.61, "total_tokens": 41554176} {"current_steps": 32815, "total_steps": 40000, "loss": 0.0231, "lr": 0.023262511903671484, "epoch": 1.6033762489922556, "percentage": 82.04, "elapsed_time": "1 day, 10:48:33", "remaining_time": "7:37:18", "throughput": 331.65, "total_tokens": 41560640} {"current_steps": 32820, "total_steps": 40000, "loss": 0.0816, "lr": 0.023231013578767324, "epoch": 1.60362055065595, "percentage": 82.05, "elapsed_time": "1 day, 10:48:37", "remaining_time": "7:36:55", "throughput": 331.7, "total_tokens": 41567072} {"current_steps": 32825, "total_steps": 40000, "loss": 0.0321, "lr": 0.0231995348032339, "epoch": 1.6038648523196444, "percentage": 82.06, "elapsed_time": "1 day, 10:48:40", "remaining_time": "7:36:32", "throughput": 331.74, "total_tokens": 41573504} {"current_steps": 32830, "total_steps": 40000, "loss": 0.0705, "lr": 0.023168075581925685, "epoch": 1.6041091539833388, "percentage": 82.08, "elapsed_time": "1 day, 10:48:43", "remaining_time": "7:36:10", "throughput": 331.78, "total_tokens": 41579968} {"current_steps": 32835, "total_steps": 40000, "loss": 0.0567, "lr": 0.023136635919694126, "epoch": 1.604353455647033, "percentage": 82.09, "elapsed_time": "1 day, 10:48:46", "remaining_time": "7:35:47", "throughput": 331.83, "total_tokens": 41586528} {"current_steps": 32840, "total_steps": 40000, "loss": 0.0709, "lr": 0.02310521582138753, "epoch": 1.6045977573107273, "percentage": 82.1, "elapsed_time": "1 day, 10:48:49", "remaining_time": "7:35:25", "throughput": 331.87, "total_tokens": 41593248} {"current_steps": 32845, "total_steps": 40000, "loss": 0.0655, "lr": 0.023073815291851357, "epoch": 1.6048420589744217, "percentage": 82.11, "elapsed_time": "1 day, 10:48:52", "remaining_time": "7:35:02", "throughput": 331.91, "total_tokens": 41599040} {"current_steps": 32850, "total_steps": 40000, "loss": 0.0282, "lr": 0.02304243433592788, "epoch": 1.6050863606381158, "percentage": 82.12, "elapsed_time": "1 day, 10:48:55", "remaining_time": "7:34:40", "throughput": 331.95, "total_tokens": 41605184} {"current_steps": 32855, "total_steps": 40000, "loss": 0.062, "lr": 0.023011072958456513, "epoch": 1.6053306623018102, "percentage": 82.14, "elapsed_time": "1 day, 10:48:58", "remaining_time": "7:34:17", "throughput": 331.99, "total_tokens": 41611488} {"current_steps": 32860, "total_steps": 40000, "loss": 0.0643, "lr": 0.022979731164273536, "epoch": 1.6055749639655046, "percentage": 82.15, "elapsed_time": "1 day, 10:49:01", "remaining_time": "7:33:54", "throughput": 332.04, "total_tokens": 41618080} {"current_steps": 32865, "total_steps": 40000, "loss": 0.0632, "lr": 0.022948408958212218, "epoch": 1.605819265629199, "percentage": 82.16, "elapsed_time": "1 day, 10:49:04", "remaining_time": "7:33:32", "throughput": 332.08, "total_tokens": 41624096} {"current_steps": 32870, "total_steps": 40000, "loss": 0.0549, "lr": 0.022917106345102876, "epoch": 1.6060635672928933, "percentage": 82.17, "elapsed_time": "1 day, 10:49:07", "remaining_time": "7:33:09", "throughput": 332.12, "total_tokens": 41630016} {"current_steps": 32875, "total_steps": 40000, "loss": 0.0727, "lr": 0.022885823329772785, "epoch": 1.6063078689565877, "percentage": 82.19, "elapsed_time": "1 day, 10:49:10", "remaining_time": "7:32:47", "throughput": 332.16, "total_tokens": 41636288} {"current_steps": 32880, "total_steps": 40000, "loss": 0.0414, "lr": 0.02285455991704612, "epoch": 1.6065521706202819, "percentage": 82.2, "elapsed_time": "1 day, 10:49:13", "remaining_time": "7:32:24", "throughput": 332.2, "total_tokens": 41642240} {"current_steps": 32885, "total_steps": 40000, "loss": 0.0479, "lr": 0.022823316111744117, "epoch": 1.6067964722839763, "percentage": 82.21, "elapsed_time": "1 day, 10:49:16", "remaining_time": "7:32:02", "throughput": 332.24, "total_tokens": 41648192} {"current_steps": 32890, "total_steps": 40000, "loss": 0.0615, "lr": 0.022792091918685014, "epoch": 1.6070407739476704, "percentage": 82.23, "elapsed_time": "1 day, 10:49:19", "remaining_time": "7:31:39", "throughput": 332.28, "total_tokens": 41654336} {"current_steps": 32895, "total_steps": 40000, "loss": 0.0582, "lr": 0.022760887342683906, "epoch": 1.6072850756113648, "percentage": 82.24, "elapsed_time": "1 day, 10:49:22", "remaining_time": "7:31:17", "throughput": 332.32, "total_tokens": 41660512} {"current_steps": 32900, "total_steps": 40000, "loss": 0.0902, "lr": 0.022729702388552975, "epoch": 1.6075293772750592, "percentage": 82.25, "elapsed_time": "1 day, 10:49:25", "remaining_time": "7:30:54", "throughput": 332.36, "total_tokens": 41667136} {"current_steps": 32905, "total_steps": 40000, "loss": 0.0598, "lr": 0.022698537061101292, "epoch": 1.6077736789387536, "percentage": 82.26, "elapsed_time": "1 day, 10:49:29", "remaining_time": "7:30:32", "throughput": 332.41, "total_tokens": 41673856} {"current_steps": 32910, "total_steps": 40000, "loss": 0.0642, "lr": 0.022667391365134962, "epoch": 1.608017980602448, "percentage": 82.27, "elapsed_time": "1 day, 10:49:32", "remaining_time": "7:30:09", "throughput": 332.45, "total_tokens": 41680128} {"current_steps": 32915, "total_steps": 40000, "loss": 0.0504, "lr": 0.022636265305457065, "epoch": 1.6082622822661423, "percentage": 82.29, "elapsed_time": "1 day, 10:49:35", "remaining_time": "7:29:47", "throughput": 332.5, "total_tokens": 41686656} {"current_steps": 32920, "total_steps": 40000, "loss": 0.062, "lr": 0.02260515888686764, "epoch": 1.6085065839298367, "percentage": 82.3, "elapsed_time": "1 day, 10:49:38", "remaining_time": "7:29:24", "throughput": 332.54, "total_tokens": 41692864} {"current_steps": 32925, "total_steps": 40000, "loss": 0.0386, "lr": 0.022574072114163596, "epoch": 1.6087508855935309, "percentage": 82.31, "elapsed_time": "1 day, 10:49:41", "remaining_time": "7:29:02", "throughput": 332.58, "total_tokens": 41699392} {"current_steps": 32930, "total_steps": 40000, "loss": 0.0498, "lr": 0.022543004992139005, "epoch": 1.6089951872572252, "percentage": 82.33, "elapsed_time": "1 day, 10:49:44", "remaining_time": "7:28:39", "throughput": 332.62, "total_tokens": 41705760} {"current_steps": 32935, "total_steps": 40000, "loss": 0.0773, "lr": 0.022511957525584745, "epoch": 1.6092394889209194, "percentage": 82.34, "elapsed_time": "1 day, 10:49:47", "remaining_time": "7:28:17", "throughput": 332.66, "total_tokens": 41711840} {"current_steps": 32940, "total_steps": 40000, "loss": 0.0628, "lr": 0.022480929719288778, "epoch": 1.6094837905846138, "percentage": 82.35, "elapsed_time": "1 day, 10:49:50", "remaining_time": "7:27:54", "throughput": 332.7, "total_tokens": 41717984} {"current_steps": 32945, "total_steps": 40000, "loss": 0.0464, "lr": 0.02244992157803592, "epoch": 1.6097280922483082, "percentage": 82.36, "elapsed_time": "1 day, 10:49:53", "remaining_time": "7:27:32", "throughput": 332.74, "total_tokens": 41724032} {"current_steps": 32950, "total_steps": 40000, "loss": 0.0562, "lr": 0.022418933106608047, "epoch": 1.6099723939120025, "percentage": 82.38, "elapsed_time": "1 day, 10:49:56", "remaining_time": "7:27:09", "throughput": 332.79, "total_tokens": 41730720} {"current_steps": 32955, "total_steps": 40000, "loss": 0.0584, "lr": 0.022387964309784018, "epoch": 1.610216695575697, "percentage": 82.39, "elapsed_time": "1 day, 10:49:59", "remaining_time": "7:26:47", "throughput": 332.83, "total_tokens": 41737184} {"current_steps": 32960, "total_steps": 40000, "loss": 0.0614, "lr": 0.022357015192339517, "epoch": 1.6104609972393913, "percentage": 82.4, "elapsed_time": "1 day, 10:50:02", "remaining_time": "7:26:25", "throughput": 332.88, "total_tokens": 41743488} {"current_steps": 32965, "total_steps": 40000, "loss": 0.061, "lr": 0.02232608575904734, "epoch": 1.6107052989030857, "percentage": 82.41, "elapsed_time": "1 day, 10:50:05", "remaining_time": "7:26:02", "throughput": 332.92, "total_tokens": 41749952} {"current_steps": 32970, "total_steps": 40000, "loss": 0.0449, "lr": 0.022295176014677225, "epoch": 1.6109496005667798, "percentage": 82.42, "elapsed_time": "1 day, 10:50:08", "remaining_time": "7:25:40", "throughput": 332.96, "total_tokens": 41755968} {"current_steps": 32975, "total_steps": 40000, "loss": 0.0584, "lr": 0.02226428596399577, "epoch": 1.6111939022304742, "percentage": 82.44, "elapsed_time": "1 day, 10:50:12", "remaining_time": "7:25:17", "throughput": 333.0, "total_tokens": 41762336} {"current_steps": 32980, "total_steps": 40000, "loss": 0.0523, "lr": 0.02223341561176669, "epoch": 1.6114382038941684, "percentage": 82.45, "elapsed_time": "1 day, 10:50:15", "remaining_time": "7:24:55", "throughput": 333.04, "total_tokens": 41768320} {"current_steps": 32985, "total_steps": 40000, "loss": 0.049, "lr": 0.0222025649627505, "epoch": 1.6116825055578627, "percentage": 82.46, "elapsed_time": "1 day, 10:50:18", "remaining_time": "7:24:32", "throughput": 333.08, "total_tokens": 41774624} {"current_steps": 32990, "total_steps": 40000, "loss": 0.0581, "lr": 0.022171734021704814, "epoch": 1.6119268072215571, "percentage": 82.47, "elapsed_time": "1 day, 10:50:21", "remaining_time": "7:24:10", "throughput": 333.12, "total_tokens": 41780800} {"current_steps": 32995, "total_steps": 40000, "loss": 0.0415, "lr": 0.022140922793384116, "epoch": 1.6121711088852515, "percentage": 82.49, "elapsed_time": "1 day, 10:50:24", "remaining_time": "7:23:48", "throughput": 333.17, "total_tokens": 41787264} {"current_steps": 33000, "total_steps": 40000, "loss": 0.087, "lr": 0.022110131282539934, "epoch": 1.6124154105489459, "percentage": 82.5, "elapsed_time": "1 day, 10:50:27", "remaining_time": "7:23:25", "throughput": 333.21, "total_tokens": 41793376} {"current_steps": 33000, "total_steps": 40000, "eval_loss": 0.06099846214056015, "epoch": 1.6124154105489459, "percentage": 82.5, "elapsed_time": "1 day, 11:01:00", "remaining_time": "7:25:40", "throughput": 331.53, "total_tokens": 41793376} {"current_steps": 33005, "total_steps": 40000, "loss": 0.0586, "lr": 0.022079359493920675, "epoch": 1.6126597122126403, "percentage": 82.51, "elapsed_time": "1 day, 11:01:04", "remaining_time": "7:25:17", "throughput": 331.58, "total_tokens": 41800192} {"current_steps": 33010, "total_steps": 40000, "loss": 0.0318, "lr": 0.02204860743227169, "epoch": 1.6129040138763346, "percentage": 82.53, "elapsed_time": "1 day, 11:01:07", "remaining_time": "7:24:55", "throughput": 331.61, "total_tokens": 41805984} {"current_steps": 33015, "total_steps": 40000, "loss": 0.055, "lr": 0.022017875102335365, "epoch": 1.6131483155400288, "percentage": 82.54, "elapsed_time": "1 day, 11:01:10", "remaining_time": "7:24:32", "throughput": 331.66, "total_tokens": 41812256} {"current_steps": 33020, "total_steps": 40000, "loss": 0.0485, "lr": 0.02198716250885108, "epoch": 1.6133926172037232, "percentage": 82.55, "elapsed_time": "1 day, 11:01:14", "remaining_time": "7:24:10", "throughput": 331.7, "total_tokens": 41818720} {"current_steps": 33025, "total_steps": 40000, "loss": 0.0433, "lr": 0.021956469656555, "epoch": 1.6136369188674173, "percentage": 82.56, "elapsed_time": "1 day, 11:01:17", "remaining_time": "7:23:47", "throughput": 331.74, "total_tokens": 41825184} {"current_steps": 33030, "total_steps": 40000, "loss": 0.0754, "lr": 0.0219257965501804, "epoch": 1.6138812205311117, "percentage": 82.58, "elapsed_time": "1 day, 11:01:20", "remaining_time": "7:23:25", "throughput": 331.78, "total_tokens": 41831232} {"current_steps": 33035, "total_steps": 40000, "loss": 0.0515, "lr": 0.021895143194457494, "epoch": 1.614125522194806, "percentage": 82.59, "elapsed_time": "1 day, 11:01:23", "remaining_time": "7:23:03", "throughput": 331.83, "total_tokens": 41837824} {"current_steps": 33040, "total_steps": 40000, "loss": 0.031, "lr": 0.021864509594113322, "epoch": 1.6143698238585005, "percentage": 82.6, "elapsed_time": "1 day, 11:01:26", "remaining_time": "7:22:40", "throughput": 331.87, "total_tokens": 41844160} {"current_steps": 33045, "total_steps": 40000, "loss": 0.0479, "lr": 0.02183389575387207, "epoch": 1.6146141255221949, "percentage": 82.61, "elapsed_time": "1 day, 11:01:29", "remaining_time": "7:22:18", "throughput": 331.91, "total_tokens": 41851008} {"current_steps": 33050, "total_steps": 40000, "loss": 0.0547, "lr": 0.021803301678454682, "epoch": 1.6148584271858892, "percentage": 82.62, "elapsed_time": "1 day, 11:01:32", "remaining_time": "7:21:55", "throughput": 331.96, "total_tokens": 41857184} {"current_steps": 33055, "total_steps": 40000, "loss": 0.0756, "lr": 0.021772727372579213, "epoch": 1.6151027288495836, "percentage": 82.64, "elapsed_time": "1 day, 11:01:35", "remaining_time": "7:21:33", "throughput": 331.99, "total_tokens": 41863072} {"current_steps": 33060, "total_steps": 40000, "loss": 0.06, "lr": 0.02174217284096061, "epoch": 1.6153470305132778, "percentage": 82.65, "elapsed_time": "1 day, 11:01:38", "remaining_time": "7:21:10", "throughput": 332.04, "total_tokens": 41869600} {"current_steps": 33065, "total_steps": 40000, "loss": 0.0612, "lr": 0.0217116380883107, "epoch": 1.6155913321769722, "percentage": 82.66, "elapsed_time": "1 day, 11:01:41", "remaining_time": "7:20:48", "throughput": 332.08, "total_tokens": 41875840} {"current_steps": 33070, "total_steps": 40000, "loss": 0.0579, "lr": 0.021681123119338425, "epoch": 1.6158356338406663, "percentage": 82.67, "elapsed_time": "1 day, 11:01:44", "remaining_time": "7:20:25", "throughput": 332.12, "total_tokens": 41881888} {"current_steps": 33075, "total_steps": 40000, "loss": 0.0754, "lr": 0.02165062793874951, "epoch": 1.6160799355043607, "percentage": 82.69, "elapsed_time": "1 day, 11:01:47", "remaining_time": "7:20:03", "throughput": 332.16, "total_tokens": 41887712} {"current_steps": 33080, "total_steps": 40000, "loss": 0.0561, "lr": 0.021620152551246666, "epoch": 1.616324237168055, "percentage": 82.7, "elapsed_time": "1 day, 11:01:50", "remaining_time": "7:19:41", "throughput": 332.2, "total_tokens": 41894208} {"current_steps": 33085, "total_steps": 40000, "loss": 0.0373, "lr": 0.02158969696152967, "epoch": 1.6165685388317494, "percentage": 82.71, "elapsed_time": "1 day, 11:01:53", "remaining_time": "7:19:18", "throughput": 332.24, "total_tokens": 41900608} {"current_steps": 33090, "total_steps": 40000, "loss": 0.0462, "lr": 0.021559261174295057, "epoch": 1.6168128404954438, "percentage": 82.73, "elapsed_time": "1 day, 11:01:56", "remaining_time": "7:18:56", "throughput": 332.28, "total_tokens": 41906656} {"current_steps": 33095, "total_steps": 40000, "loss": 0.0399, "lr": 0.02152884519423646, "epoch": 1.6170571421591382, "percentage": 82.74, "elapsed_time": "1 day, 11:01:59", "remaining_time": "7:18:33", "throughput": 332.33, "total_tokens": 41913120} {"current_steps": 33100, "total_steps": 40000, "loss": 0.0491, "lr": 0.021498449026044447, "epoch": 1.6173014438228326, "percentage": 82.75, "elapsed_time": "1 day, 11:02:03", "remaining_time": "7:18:11", "throughput": 332.37, "total_tokens": 41919904} {"current_steps": 33105, "total_steps": 40000, "loss": 0.0977, "lr": 0.021468072674406414, "epoch": 1.6175457454865267, "percentage": 82.76, "elapsed_time": "1 day, 11:02:06", "remaining_time": "7:17:49", "throughput": 332.41, "total_tokens": 41926016} {"current_steps": 33110, "total_steps": 40000, "loss": 0.0403, "lr": 0.021437716144006795, "epoch": 1.6177900471502211, "percentage": 82.78, "elapsed_time": "1 day, 11:02:09", "remaining_time": "7:17:26", "throughput": 332.46, "total_tokens": 41932640} {"current_steps": 33115, "total_steps": 40000, "loss": 0.0493, "lr": 0.021407379439527002, "epoch": 1.6180343488139153, "percentage": 82.79, "elapsed_time": "1 day, 11:02:12", "remaining_time": "7:17:04", "throughput": 332.5, "total_tokens": 41938688} {"current_steps": 33120, "total_steps": 40000, "loss": 0.0388, "lr": 0.021377062565645255, "epoch": 1.6182786504776097, "percentage": 82.8, "elapsed_time": "1 day, 11:02:15", "remaining_time": "7:16:42", "throughput": 332.54, "total_tokens": 41945312} {"current_steps": 33125, "total_steps": 40000, "loss": 0.038, "lr": 0.02134676552703688, "epoch": 1.618522952141304, "percentage": 82.81, "elapsed_time": "1 day, 11:02:18", "remaining_time": "7:16:19", "throughput": 332.58, "total_tokens": 41951584} {"current_steps": 33130, "total_steps": 40000, "loss": 0.0295, "lr": 0.02131648832837398, "epoch": 1.6187672538049984, "percentage": 82.83, "elapsed_time": "1 day, 11:02:21", "remaining_time": "7:15:57", "throughput": 332.62, "total_tokens": 41957248} {"current_steps": 33135, "total_steps": 40000, "loss": 0.0541, "lr": 0.02128623097432574, "epoch": 1.6190115554686928, "percentage": 82.84, "elapsed_time": "1 day, 11:02:24", "remaining_time": "7:15:34", "throughput": 332.66, "total_tokens": 41963424} {"current_steps": 33140, "total_steps": 40000, "loss": 0.0737, "lr": 0.021255993469558192, "epoch": 1.6192558571323872, "percentage": 82.85, "elapsed_time": "1 day, 11:02:27", "remaining_time": "7:15:12", "throughput": 332.7, "total_tokens": 41969760} {"current_steps": 33145, "total_steps": 40000, "loss": 0.0629, "lr": 0.021225775818734364, "epoch": 1.6195001587960816, "percentage": 82.86, "elapsed_time": "1 day, 11:02:30", "remaining_time": "7:14:50", "throughput": 332.74, "total_tokens": 41975808} {"current_steps": 33150, "total_steps": 40000, "loss": 0.0408, "lr": 0.021195578026514166, "epoch": 1.6197444604597757, "percentage": 82.88, "elapsed_time": "1 day, 11:02:33", "remaining_time": "7:14:27", "throughput": 332.78, "total_tokens": 41981856} {"current_steps": 33155, "total_steps": 40000, "loss": 0.0774, "lr": 0.02116540009755452, "epoch": 1.61998876212347, "percentage": 82.89, "elapsed_time": "1 day, 11:02:36", "remaining_time": "7:14:05", "throughput": 332.83, "total_tokens": 41988352} {"current_steps": 33160, "total_steps": 40000, "loss": 0.0561, "lr": 0.021135242036509173, "epoch": 1.6202330637871643, "percentage": 82.9, "elapsed_time": "1 day, 11:02:39", "remaining_time": "7:13:43", "throughput": 332.87, "total_tokens": 41994784} {"current_steps": 33165, "total_steps": 40000, "loss": 0.0593, "lr": 0.021105103848028967, "epoch": 1.6204773654508586, "percentage": 82.91, "elapsed_time": "1 day, 11:02:42", "remaining_time": "7:13:20", "throughput": 332.91, "total_tokens": 42000896} {"current_steps": 33170, "total_steps": 40000, "loss": 0.0474, "lr": 0.021074985536761504, "epoch": 1.620721667114553, "percentage": 82.93, "elapsed_time": "1 day, 11:02:45", "remaining_time": "7:12:58", "throughput": 332.95, "total_tokens": 42006848} {"current_steps": 33175, "total_steps": 40000, "loss": 0.057, "lr": 0.021044887107351435, "epoch": 1.6209659687782474, "percentage": 82.94, "elapsed_time": "1 day, 11:02:48", "remaining_time": "7:12:36", "throughput": 332.99, "total_tokens": 42012864} {"current_steps": 33180, "total_steps": 40000, "loss": 0.0787, "lr": 0.021014808564440362, "epoch": 1.6212102704419418, "percentage": 82.95, "elapsed_time": "1 day, 11:02:51", "remaining_time": "7:12:14", "throughput": 333.03, "total_tokens": 42019072} {"current_steps": 33185, "total_steps": 40000, "loss": 0.0467, "lr": 0.02098474991266671, "epoch": 1.6214545721056361, "percentage": 82.96, "elapsed_time": "1 day, 11:02:54", "remaining_time": "7:11:51", "throughput": 333.07, "total_tokens": 42025504} {"current_steps": 33190, "total_steps": 40000, "loss": 0.0563, "lr": 0.02095471115666592, "epoch": 1.6216988737693305, "percentage": 82.97, "elapsed_time": "1 day, 11:02:57", "remaining_time": "7:11:29", "throughput": 333.11, "total_tokens": 42031712} {"current_steps": 33195, "total_steps": 40000, "loss": 0.097, "lr": 0.020924692301070406, "epoch": 1.6219431754330247, "percentage": 82.99, "elapsed_time": "1 day, 11:03:00", "remaining_time": "7:11:07", "throughput": 333.16, "total_tokens": 42038016} {"current_steps": 33200, "total_steps": 40000, "loss": 0.0538, "lr": 0.020894693350509346, "epoch": 1.622187477096719, "percentage": 83.0, "elapsed_time": "1 day, 11:03:04", "remaining_time": "7:10:44", "throughput": 333.2, "total_tokens": 42044352} {"current_steps": 33200, "total_steps": 40000, "eval_loss": 0.061745792627334595, "epoch": 1.622187477096719, "percentage": 83.0, "elapsed_time": "1 day, 11:13:37", "remaining_time": "7:12:54", "throughput": 331.53, "total_tokens": 42044352} {"current_steps": 33205, "total_steps": 40000, "loss": 0.0369, "lr": 0.020864714309609057, "epoch": 1.6224317787604132, "percentage": 83.01, "elapsed_time": "1 day, 11:13:41", "remaining_time": "7:12:32", "throughput": 331.57, "total_tokens": 42050336} {"current_steps": 33210, "total_steps": 40000, "loss": 0.0663, "lr": 0.020834755182992604, "epoch": 1.6226760804241076, "percentage": 83.03, "elapsed_time": "1 day, 11:13:44", "remaining_time": "7:12:10", "throughput": 331.61, "total_tokens": 42056384} {"current_steps": 33215, "total_steps": 40000, "loss": 0.0677, "lr": 0.02080481597528011, "epoch": 1.622920382087802, "percentage": 83.04, "elapsed_time": "1 day, 11:13:47", "remaining_time": "7:11:47", "throughput": 331.65, "total_tokens": 42062720} {"current_steps": 33220, "total_steps": 40000, "loss": 0.0524, "lr": 0.020774896691088583, "epoch": 1.6231646837514964, "percentage": 83.05, "elapsed_time": "1 day, 11:13:50", "remaining_time": "7:11:25", "throughput": 331.7, "total_tokens": 42069280} {"current_steps": 33225, "total_steps": 40000, "loss": 0.069, "lr": 0.020744997335031882, "epoch": 1.6234089854151907, "percentage": 83.06, "elapsed_time": "1 day, 11:13:53", "remaining_time": "7:11:03", "throughput": 331.74, "total_tokens": 42075552} {"current_steps": 33230, "total_steps": 40000, "loss": 0.0343, "lr": 0.02071511791172092, "epoch": 1.6236532870788851, "percentage": 83.08, "elapsed_time": "1 day, 11:13:57", "remaining_time": "7:10:40", "throughput": 331.78, "total_tokens": 42082240} {"current_steps": 33235, "total_steps": 40000, "loss": 0.0563, "lr": 0.02068525842576351, "epoch": 1.6238975887425795, "percentage": 83.09, "elapsed_time": "1 day, 11:14:00", "remaining_time": "7:10:18", "throughput": 331.82, "total_tokens": 42088192} {"current_steps": 33240, "total_steps": 40000, "loss": 0.0793, "lr": 0.020655418881764264, "epoch": 1.6241418904062737, "percentage": 83.1, "elapsed_time": "1 day, 11:14:03", "remaining_time": "7:09:56", "throughput": 331.86, "total_tokens": 42094592} {"current_steps": 33245, "total_steps": 40000, "loss": 0.0626, "lr": 0.020625599284324923, "epoch": 1.624386192069968, "percentage": 83.11, "elapsed_time": "1 day, 11:14:06", "remaining_time": "7:09:33", "throughput": 331.9, "total_tokens": 42100512} {"current_steps": 33250, "total_steps": 40000, "loss": 0.0229, "lr": 0.02059579963804396, "epoch": 1.6246304937336622, "percentage": 83.12, "elapsed_time": "1 day, 11:14:09", "remaining_time": "7:09:11", "throughput": 331.95, "total_tokens": 42106976} {"current_steps": 33255, "total_steps": 40000, "loss": 0.0563, "lr": 0.02056601994751688, "epoch": 1.6248747953973566, "percentage": 83.14, "elapsed_time": "1 day, 11:14:12", "remaining_time": "7:08:49", "throughput": 331.99, "total_tokens": 42113152} {"current_steps": 33260, "total_steps": 40000, "loss": 0.0542, "lr": 0.02053626021733614, "epoch": 1.625119097061051, "percentage": 83.15, "elapsed_time": "1 day, 11:14:15", "remaining_time": "7:08:26", "throughput": 332.03, "total_tokens": 42119392} {"current_steps": 33265, "total_steps": 40000, "loss": 0.068, "lr": 0.02050652045209097, "epoch": 1.6253633987247453, "percentage": 83.16, "elapsed_time": "1 day, 11:14:18", "remaining_time": "7:08:04", "throughput": 332.07, "total_tokens": 42125536} {"current_steps": 33270, "total_steps": 40000, "loss": 0.0431, "lr": 0.020476800656367672, "epoch": 1.6256077003884397, "percentage": 83.17, "elapsed_time": "1 day, 11:14:21", "remaining_time": "7:07:42", "throughput": 332.11, "total_tokens": 42131648} {"current_steps": 33275, "total_steps": 40000, "loss": 0.042, "lr": 0.020447100834749425, "epoch": 1.625852002052134, "percentage": 83.19, "elapsed_time": "1 day, 11:14:24", "remaining_time": "7:07:19", "throughput": 332.15, "total_tokens": 42137504} {"current_steps": 33280, "total_steps": 40000, "loss": 0.0436, "lr": 0.02041742099181627, "epoch": 1.6260963037158283, "percentage": 83.2, "elapsed_time": "1 day, 11:14:27", "remaining_time": "7:06:57", "throughput": 332.19, "total_tokens": 42143968} {"current_steps": 33285, "total_steps": 40000, "loss": 0.0744, "lr": 0.02038776113214526, "epoch": 1.6263406053795226, "percentage": 83.21, "elapsed_time": "1 day, 11:14:30", "remaining_time": "7:06:35", "throughput": 332.23, "total_tokens": 42150272} {"current_steps": 33290, "total_steps": 40000, "loss": 0.0612, "lr": 0.0203581212603103, "epoch": 1.626584907043217, "percentage": 83.23, "elapsed_time": "1 day, 11:14:33", "remaining_time": "7:06:12", "throughput": 332.27, "total_tokens": 42156800} {"current_steps": 33295, "total_steps": 40000, "loss": 0.042, "lr": 0.02032850138088219, "epoch": 1.6268292087069112, "percentage": 83.24, "elapsed_time": "1 day, 11:14:36", "remaining_time": "7:05:50", "throughput": 332.32, "total_tokens": 42163264} {"current_steps": 33300, "total_steps": 40000, "loss": 0.0425, "lr": 0.020298901498428754, "epoch": 1.6270735103706055, "percentage": 83.25, "elapsed_time": "1 day, 11:14:39", "remaining_time": "7:05:28", "throughput": 332.36, "total_tokens": 42169440} {"current_steps": 33305, "total_steps": 40000, "loss": 0.0669, "lr": 0.020269321617514595, "epoch": 1.6273178120343, "percentage": 83.26, "elapsed_time": "1 day, 11:14:42", "remaining_time": "7:05:06", "throughput": 332.4, "total_tokens": 42175712} {"current_steps": 33310, "total_steps": 40000, "loss": 0.0375, "lr": 0.020239761742701343, "epoch": 1.6275621136979943, "percentage": 83.28, "elapsed_time": "1 day, 11:14:45", "remaining_time": "7:04:43", "throughput": 332.44, "total_tokens": 42181536} {"current_steps": 33315, "total_steps": 40000, "loss": 0.0558, "lr": 0.02021022187854754, "epoch": 1.6278064153616887, "percentage": 83.29, "elapsed_time": "1 day, 11:14:48", "remaining_time": "7:04:21", "throughput": 332.48, "total_tokens": 42187776} {"current_steps": 33320, "total_steps": 40000, "loss": 0.0305, "lr": 0.020180702029608522, "epoch": 1.628050717025383, "percentage": 83.3, "elapsed_time": "1 day, 11:14:52", "remaining_time": "7:03:59", "throughput": 332.52, "total_tokens": 42194496} {"current_steps": 33325, "total_steps": 40000, "loss": 0.0403, "lr": 0.020151202200436695, "epoch": 1.6282950186890772, "percentage": 83.31, "elapsed_time": "1 day, 11:14:55", "remaining_time": "7:03:37", "throughput": 332.56, "total_tokens": 42200544} {"current_steps": 33330, "total_steps": 40000, "loss": 0.0581, "lr": 0.020121722395581226, "epoch": 1.6285393203527716, "percentage": 83.33, "elapsed_time": "1 day, 11:14:58", "remaining_time": "7:03:14", "throughput": 332.61, "total_tokens": 42207232} {"current_steps": 33335, "total_steps": 40000, "loss": 0.0349, "lr": 0.020092262619588342, "epoch": 1.628783622016466, "percentage": 83.34, "elapsed_time": "1 day, 11:15:01", "remaining_time": "7:02:52", "throughput": 332.65, "total_tokens": 42213440} {"current_steps": 33340, "total_steps": 40000, "loss": 0.0437, "lr": 0.02006282287700109, "epoch": 1.6290279236801601, "percentage": 83.35, "elapsed_time": "1 day, 11:15:04", "remaining_time": "7:02:30", "throughput": 332.69, "total_tokens": 42219872} {"current_steps": 33345, "total_steps": 40000, "loss": 0.0531, "lr": 0.020033403172359427, "epoch": 1.6292722253438545, "percentage": 83.36, "elapsed_time": "1 day, 11:15:07", "remaining_time": "7:02:08", "throughput": 332.73, "total_tokens": 42226432} {"current_steps": 33350, "total_steps": 40000, "loss": 0.0536, "lr": 0.020004003510200284, "epoch": 1.629516527007549, "percentage": 83.38, "elapsed_time": "1 day, 11:15:10", "remaining_time": "7:01:46", "throughput": 332.78, "total_tokens": 42232896} {"current_steps": 33355, "total_steps": 40000, "loss": 0.0408, "lr": 0.019974623895057407, "epoch": 1.6297608286712433, "percentage": 83.39, "elapsed_time": "1 day, 11:15:13", "remaining_time": "7:01:23", "throughput": 332.82, "total_tokens": 42239168} {"current_steps": 33360, "total_steps": 40000, "loss": 0.0606, "lr": 0.019945264331461553, "epoch": 1.6300051303349377, "percentage": 83.4, "elapsed_time": "1 day, 11:15:16", "remaining_time": "7:01:01", "throughput": 332.86, "total_tokens": 42245280} {"current_steps": 33365, "total_steps": 40000, "loss": 0.0686, "lr": 0.019915924823940317, "epoch": 1.630249431998632, "percentage": 83.41, "elapsed_time": "1 day, 11:15:19", "remaining_time": "7:00:39", "throughput": 332.9, "total_tokens": 42251936} {"current_steps": 33370, "total_steps": 40000, "loss": 0.0461, "lr": 0.01988660537701816, "epoch": 1.6304937336623262, "percentage": 83.43, "elapsed_time": "1 day, 11:15:22", "remaining_time": "7:00:17", "throughput": 332.95, "total_tokens": 42258560} {"current_steps": 33375, "total_steps": 40000, "loss": 0.0435, "lr": 0.01985730599521659, "epoch": 1.6307380353260206, "percentage": 83.44, "elapsed_time": "1 day, 11:15:25", "remaining_time": "6:59:55", "throughput": 332.99, "total_tokens": 42264640} {"current_steps": 33380, "total_steps": 40000, "loss": 0.0702, "lr": 0.019828026683053918, "epoch": 1.630982336989715, "percentage": 83.45, "elapsed_time": "1 day, 11:15:28", "remaining_time": "6:59:32", "throughput": 333.03, "total_tokens": 42271008} {"current_steps": 33385, "total_steps": 40000, "loss": 0.0523, "lr": 0.01979876744504535, "epoch": 1.6312266386534091, "percentage": 83.46, "elapsed_time": "1 day, 11:15:31", "remaining_time": "6:59:10", "throughput": 333.07, "total_tokens": 42277184} {"current_steps": 33390, "total_steps": 40000, "loss": 0.0994, "lr": 0.019769528285703046, "epoch": 1.6314709403171035, "percentage": 83.47, "elapsed_time": "1 day, 11:15:34", "remaining_time": "6:58:48", "throughput": 333.11, "total_tokens": 42283040} {"current_steps": 33395, "total_steps": 40000, "loss": 0.0465, "lr": 0.019740309209536098, "epoch": 1.6317152419807979, "percentage": 83.49, "elapsed_time": "1 day, 11:15:37", "remaining_time": "6:58:26", "throughput": 333.15, "total_tokens": 42289056} {"current_steps": 33400, "total_steps": 40000, "loss": 0.058, "lr": 0.019711110221050387, "epoch": 1.6319595436444922, "percentage": 83.5, "elapsed_time": "1 day, 11:15:41", "remaining_time": "6:58:04", "throughput": 333.19, "total_tokens": 42295520} {"current_steps": 33400, "total_steps": 40000, "eval_loss": 0.06121977046132088, "epoch": 1.6319595436444922, "percentage": 83.5, "elapsed_time": "1 day, 11:26:15", "remaining_time": "7:00:09", "throughput": 331.53, "total_tokens": 42295520} {"current_steps": 33405, "total_steps": 40000, "loss": 0.0582, "lr": 0.019681931324748825, "epoch": 1.6322038453081866, "percentage": 83.51, "elapsed_time": "1 day, 11:26:27", "remaining_time": "6:59:48", "throughput": 331.55, "total_tokens": 42301920} {"current_steps": 33410, "total_steps": 40000, "loss": 0.0586, "lr": 0.019652772525131094, "epoch": 1.632448146971881, "percentage": 83.53, "elapsed_time": "1 day, 11:26:30", "remaining_time": "6:59:26", "throughput": 331.59, "total_tokens": 42307872} {"current_steps": 33415, "total_steps": 40000, "loss": 0.0381, "lr": 0.019623633826693885, "epoch": 1.6326924486355752, "percentage": 83.54, "elapsed_time": "1 day, 11:26:33", "remaining_time": "6:59:04", "throughput": 331.63, "total_tokens": 42314336} {"current_steps": 33420, "total_steps": 40000, "loss": 0.0648, "lr": 0.019594515233930788, "epoch": 1.6329367502992695, "percentage": 83.55, "elapsed_time": "1 day, 11:26:36", "remaining_time": "6:58:42", "throughput": 331.68, "total_tokens": 42320576} {"current_steps": 33425, "total_steps": 40000, "loss": 0.0292, "lr": 0.019565416751332186, "epoch": 1.6331810519629637, "percentage": 83.56, "elapsed_time": "1 day, 11:26:39", "remaining_time": "6:58:19", "throughput": 331.71, "total_tokens": 42326560} {"current_steps": 33430, "total_steps": 40000, "loss": 0.0504, "lr": 0.019536338383385497, "epoch": 1.633425353626658, "percentage": 83.58, "elapsed_time": "1 day, 11:26:42", "remaining_time": "6:57:57", "throughput": 331.75, "total_tokens": 42332672} {"current_steps": 33435, "total_steps": 40000, "loss": 0.0534, "lr": 0.019507280134574933, "epoch": 1.6336696552903525, "percentage": 83.59, "elapsed_time": "1 day, 11:26:45", "remaining_time": "6:57:35", "throughput": 331.8, "total_tokens": 42339040} {"current_steps": 33440, "total_steps": 40000, "loss": 0.0389, "lr": 0.019478242009381624, "epoch": 1.6339139569540468, "percentage": 83.6, "elapsed_time": "1 day, 11:26:48", "remaining_time": "6:57:13", "throughput": 331.84, "total_tokens": 42345472} {"current_steps": 33445, "total_steps": 40000, "loss": 0.0895, "lr": 0.01944922401228367, "epoch": 1.6341582586177412, "percentage": 83.61, "elapsed_time": "1 day, 11:26:51", "remaining_time": "6:56:50", "throughput": 331.88, "total_tokens": 42351616} {"current_steps": 33450, "total_steps": 40000, "loss": 0.0764, "lr": 0.01942022614775593, "epoch": 1.6344025602814356, "percentage": 83.62, "elapsed_time": "1 day, 11:26:54", "remaining_time": "6:56:28", "throughput": 331.92, "total_tokens": 42357696} {"current_steps": 33455, "total_steps": 40000, "loss": 0.0425, "lr": 0.01939124842027029, "epoch": 1.63464686194513, "percentage": 83.64, "elapsed_time": "1 day, 11:26:57", "remaining_time": "6:56:06", "throughput": 331.96, "total_tokens": 42363904} {"current_steps": 33460, "total_steps": 40000, "loss": 0.0459, "lr": 0.01936229083429551, "epoch": 1.6348911636088241, "percentage": 83.65, "elapsed_time": "1 day, 11:27:00", "remaining_time": "6:55:44", "throughput": 332.0, "total_tokens": 42369888} {"current_steps": 33465, "total_steps": 40000, "loss": 0.0522, "lr": 0.019333353394297148, "epoch": 1.6351354652725185, "percentage": 83.66, "elapsed_time": "1 day, 11:27:03", "remaining_time": "6:55:22", "throughput": 332.04, "total_tokens": 42376640} {"current_steps": 33470, "total_steps": 40000, "loss": 0.0798, "lr": 0.019304436104737754, "epoch": 1.6353797669362127, "percentage": 83.67, "elapsed_time": "1 day, 11:27:06", "remaining_time": "6:54:59", "throughput": 332.09, "total_tokens": 42382944} {"current_steps": 33475, "total_steps": 40000, "loss": 0.0326, "lr": 0.019275538970076778, "epoch": 1.635624068599907, "percentage": 83.69, "elapsed_time": "1 day, 11:27:09", "remaining_time": "6:54:37", "throughput": 332.13, "total_tokens": 42389440} {"current_steps": 33480, "total_steps": 40000, "loss": 0.0463, "lr": 0.019246661994770434, "epoch": 1.6358683702636014, "percentage": 83.7, "elapsed_time": "1 day, 11:27:12", "remaining_time": "6:54:15", "throughput": 332.17, "total_tokens": 42395584} {"current_steps": 33485, "total_steps": 40000, "loss": 0.0662, "lr": 0.019217805183271985, "epoch": 1.6361126719272958, "percentage": 83.71, "elapsed_time": "1 day, 11:27:15", "remaining_time": "6:53:53", "throughput": 332.21, "total_tokens": 42401728} {"current_steps": 33490, "total_steps": 40000, "loss": 0.0563, "lr": 0.019188968540031465, "epoch": 1.6363569735909902, "percentage": 83.73, "elapsed_time": "1 day, 11:27:19", "remaining_time": "6:53:31", "throughput": 332.25, "total_tokens": 42408480} {"current_steps": 33495, "total_steps": 40000, "loss": 0.0514, "lr": 0.019160152069495867, "epoch": 1.6366012752546846, "percentage": 83.74, "elapsed_time": "1 day, 11:27:22", "remaining_time": "6:53:09", "throughput": 332.3, "total_tokens": 42415104} {"current_steps": 33500, "total_steps": 40000, "loss": 0.05, "lr": 0.019131355776109103, "epoch": 1.636845576918379, "percentage": 83.75, "elapsed_time": "1 day, 11:27:25", "remaining_time": "6:52:46", "throughput": 332.34, "total_tokens": 42421504} {"current_steps": 33505, "total_steps": 40000, "loss": 0.0426, "lr": 0.019102579664311857, "epoch": 1.637089878582073, "percentage": 83.76, "elapsed_time": "1 day, 11:27:28", "remaining_time": "6:52:24", "throughput": 332.38, "total_tokens": 42428032} {"current_steps": 33510, "total_steps": 40000, "loss": 0.0614, "lr": 0.019073823738541763, "epoch": 1.6373341802457675, "percentage": 83.78, "elapsed_time": "1 day, 11:27:31", "remaining_time": "6:52:02", "throughput": 332.42, "total_tokens": 42433920} {"current_steps": 33515, "total_steps": 40000, "loss": 0.0587, "lr": 0.0190450880032334, "epoch": 1.6375784819094616, "percentage": 83.79, "elapsed_time": "1 day, 11:27:34", "remaining_time": "6:51:40", "throughput": 332.46, "total_tokens": 42440288} {"current_steps": 33520, "total_steps": 40000, "loss": 0.0409, "lr": 0.019016372462818114, "epoch": 1.637822783573156, "percentage": 83.8, "elapsed_time": "1 day, 11:27:37", "remaining_time": "6:51:18", "throughput": 332.5, "total_tokens": 42446752} {"current_steps": 33525, "total_steps": 40000, "loss": 0.0917, "lr": 0.018987677121724278, "epoch": 1.6380670852368504, "percentage": 83.81, "elapsed_time": "1 day, 11:27:40", "remaining_time": "6:50:56", "throughput": 332.55, "total_tokens": 42452992} {"current_steps": 33530, "total_steps": 40000, "loss": 0.0605, "lr": 0.018959001984377, "epoch": 1.6383113869005448, "percentage": 83.83, "elapsed_time": "1 day, 11:27:43", "remaining_time": "6:50:34", "throughput": 332.59, "total_tokens": 42459552} {"current_steps": 33535, "total_steps": 40000, "loss": 0.0428, "lr": 0.018930347055198377, "epoch": 1.6385556885642392, "percentage": 83.84, "elapsed_time": "1 day, 11:27:46", "remaining_time": "6:50:12", "throughput": 332.63, "total_tokens": 42465728} {"current_steps": 33540, "total_steps": 40000, "loss": 0.0656, "lr": 0.01890171233860739, "epoch": 1.6387999902279335, "percentage": 83.85, "elapsed_time": "1 day, 11:27:49", "remaining_time": "6:49:49", "throughput": 332.67, "total_tokens": 42472096} {"current_steps": 33545, "total_steps": 40000, "loss": 0.052, "lr": 0.018873097839019807, "epoch": 1.639044291891628, "percentage": 83.86, "elapsed_time": "1 day, 11:27:52", "remaining_time": "6:49:27", "throughput": 332.71, "total_tokens": 42478336} {"current_steps": 33550, "total_steps": 40000, "loss": 0.0799, "lr": 0.0188445035608484, "epoch": 1.639288593555322, "percentage": 83.88, "elapsed_time": "1 day, 11:27:56", "remaining_time": "6:49:05", "throughput": 332.76, "total_tokens": 42484992} {"current_steps": 33555, "total_steps": 40000, "loss": 0.0538, "lr": 0.018815929508502777, "epoch": 1.6395328952190165, "percentage": 83.89, "elapsed_time": "1 day, 11:27:59", "remaining_time": "6:48:43", "throughput": 332.8, "total_tokens": 42491072} {"current_steps": 33560, "total_steps": 40000, "loss": 0.0553, "lr": 0.01878737568638934, "epoch": 1.6397771968827106, "percentage": 83.9, "elapsed_time": "1 day, 11:28:02", "remaining_time": "6:48:21", "throughput": 332.84, "total_tokens": 42497344} {"current_steps": 33565, "total_steps": 40000, "loss": 0.0284, "lr": 0.01875884209891152, "epoch": 1.640021498546405, "percentage": 83.91, "elapsed_time": "1 day, 11:28:05", "remaining_time": "6:47:59", "throughput": 332.88, "total_tokens": 42503520} {"current_steps": 33570, "total_steps": 40000, "loss": 0.0519, "lr": 0.018730328750469514, "epoch": 1.6402658002100994, "percentage": 83.93, "elapsed_time": "1 day, 11:28:08", "remaining_time": "6:47:37", "throughput": 332.92, "total_tokens": 42510048} {"current_steps": 33575, "total_steps": 40000, "loss": 0.0659, "lr": 0.018701835645460473, "epoch": 1.6405101018737938, "percentage": 83.94, "elapsed_time": "1 day, 11:28:11", "remaining_time": "6:47:15", "throughput": 332.96, "total_tokens": 42516128} {"current_steps": 33580, "total_steps": 40000, "loss": 0.0407, "lr": 0.01867336278827838, "epoch": 1.6407544035374881, "percentage": 83.95, "elapsed_time": "1 day, 11:28:14", "remaining_time": "6:46:53", "throughput": 333.0, "total_tokens": 42522432} {"current_steps": 33585, "total_steps": 40000, "loss": 0.0623, "lr": 0.018644910183314056, "epoch": 1.6409987052011825, "percentage": 83.96, "elapsed_time": "1 day, 11:28:17", "remaining_time": "6:46:31", "throughput": 333.04, "total_tokens": 42528992} {"current_steps": 33590, "total_steps": 40000, "loss": 0.0733, "lr": 0.01861647783495531, "epoch": 1.641243006864877, "percentage": 83.97, "elapsed_time": "1 day, 11:28:20", "remaining_time": "6:46:09", "throughput": 333.09, "total_tokens": 42535232} {"current_steps": 33595, "total_steps": 40000, "loss": 0.0446, "lr": 0.01858806574758676, "epoch": 1.641487308528571, "percentage": 83.99, "elapsed_time": "1 day, 11:28:23", "remaining_time": "6:45:47", "throughput": 333.12, "total_tokens": 42541216} {"current_steps": 33600, "total_steps": 40000, "loss": 0.0525, "lr": 0.01855967392558988, "epoch": 1.6417316101922654, "percentage": 84.0, "elapsed_time": "1 day, 11:28:26", "remaining_time": "6:45:25", "throughput": 333.17, "total_tokens": 42547680} {"current_steps": 33600, "total_steps": 40000, "eval_loss": 0.061041656881570816, "epoch": 1.6417316101922654, "percentage": 84.0, "elapsed_time": "1 day, 11:39:00", "remaining_time": "6:47:25", "throughput": 331.52, "total_tokens": 42547680} {"current_steps": 33605, "total_steps": 40000, "loss": 0.0462, "lr": 0.018531302373343096, "epoch": 1.6419759118559596, "percentage": 84.01, "elapsed_time": "1 day, 11:39:05", "remaining_time": "6:47:03", "throughput": 331.56, "total_tokens": 42553728} {"current_steps": 33610, "total_steps": 40000, "loss": 0.0442, "lr": 0.018502951095221588, "epoch": 1.642220213519654, "percentage": 84.03, "elapsed_time": "1 day, 11:39:08", "remaining_time": "6:46:41", "throughput": 331.6, "total_tokens": 42559936} {"current_steps": 33615, "total_steps": 40000, "loss": 0.0443, "lr": 0.01847462009559751, "epoch": 1.6424645151833484, "percentage": 84.04, "elapsed_time": "1 day, 11:39:11", "remaining_time": "6:46:19", "throughput": 331.64, "total_tokens": 42566080} {"current_steps": 33620, "total_steps": 40000, "loss": 0.0573, "lr": 0.01844630937883992, "epoch": 1.6427088168470427, "percentage": 84.05, "elapsed_time": "1 day, 11:39:14", "remaining_time": "6:45:57", "throughput": 331.68, "total_tokens": 42572288} {"current_steps": 33625, "total_steps": 40000, "loss": 0.0852, "lr": 0.018418018949314573, "epoch": 1.642953118510737, "percentage": 84.06, "elapsed_time": "1 day, 11:39:17", "remaining_time": "6:45:35", "throughput": 331.72, "total_tokens": 42578496} {"current_steps": 33630, "total_steps": 40000, "loss": 0.0764, "lr": 0.018389748811384315, "epoch": 1.6431974201744315, "percentage": 84.08, "elapsed_time": "1 day, 11:39:20", "remaining_time": "6:45:13", "throughput": 331.76, "total_tokens": 42584320} {"current_steps": 33635, "total_steps": 40000, "loss": 0.0589, "lr": 0.018361498969408658, "epoch": 1.6434417218381259, "percentage": 84.09, "elapsed_time": "1 day, 11:39:23", "remaining_time": "6:44:51", "throughput": 331.8, "total_tokens": 42590688} {"current_steps": 33640, "total_steps": 40000, "loss": 0.0697, "lr": 0.01833326942774415, "epoch": 1.64368602350182, "percentage": 84.1, "elapsed_time": "1 day, 11:39:26", "remaining_time": "6:44:29", "throughput": 331.84, "total_tokens": 42597024} {"current_steps": 33645, "total_steps": 40000, "loss": 0.0487, "lr": 0.018305060190744155, "epoch": 1.6439303251655144, "percentage": 84.11, "elapsed_time": "1 day, 11:39:29", "remaining_time": "6:44:06", "throughput": 331.88, "total_tokens": 42603424} {"current_steps": 33650, "total_steps": 40000, "loss": 0.0691, "lr": 0.018276871262758846, "epoch": 1.6441746268292086, "percentage": 84.12, "elapsed_time": "1 day, 11:39:32", "remaining_time": "6:43:44", "throughput": 331.92, "total_tokens": 42609632} {"current_steps": 33655, "total_steps": 40000, "loss": 0.0579, "lr": 0.0182487026481353, "epoch": 1.644418928492903, "percentage": 84.14, "elapsed_time": "1 day, 11:39:35", "remaining_time": "6:43:22", "throughput": 331.97, "total_tokens": 42616544} {"current_steps": 33660, "total_steps": 40000, "loss": 0.0773, "lr": 0.018220554351217538, "epoch": 1.6446632301565973, "percentage": 84.15, "elapsed_time": "1 day, 11:39:38", "remaining_time": "6:43:00", "throughput": 332.01, "total_tokens": 42622848} {"current_steps": 33665, "total_steps": 40000, "loss": 0.0328, "lr": 0.01819242637634629, "epoch": 1.6449075318202917, "percentage": 84.16, "elapsed_time": "1 day, 11:39:41", "remaining_time": "6:42:38", "throughput": 332.05, "total_tokens": 42629216} {"current_steps": 33670, "total_steps": 40000, "loss": 0.0759, "lr": 0.01816431872785933, "epoch": 1.645151833483986, "percentage": 84.17, "elapsed_time": "1 day, 11:39:44", "remaining_time": "6:42:16", "throughput": 332.09, "total_tokens": 42634880} {"current_steps": 33675, "total_steps": 40000, "loss": 0.0602, "lr": 0.018136231410091148, "epoch": 1.6453961351476805, "percentage": 84.19, "elapsed_time": "1 day, 11:39:47", "remaining_time": "6:41:54", "throughput": 332.13, "total_tokens": 42641088} {"current_steps": 33680, "total_steps": 40000, "loss": 0.0546, "lr": 0.018108164427373175, "epoch": 1.6456404368113748, "percentage": 84.2, "elapsed_time": "1 day, 11:39:50", "remaining_time": "6:41:32", "throughput": 332.17, "total_tokens": 42647200} {"current_steps": 33685, "total_steps": 40000, "loss": 0.0566, "lr": 0.01808011778403375, "epoch": 1.645884738475069, "percentage": 84.21, "elapsed_time": "1 day, 11:39:53", "remaining_time": "6:41:10", "throughput": 332.21, "total_tokens": 42653088} {"current_steps": 33690, "total_steps": 40000, "loss": 0.0598, "lr": 0.01805209148439793, "epoch": 1.6461290401387634, "percentage": 84.23, "elapsed_time": "1 day, 11:39:56", "remaining_time": "6:40:48", "throughput": 332.25, "total_tokens": 42659264} {"current_steps": 33695, "total_steps": 40000, "loss": 0.0335, "lr": 0.018024085532787757, "epoch": 1.6463733418024575, "percentage": 84.24, "elapsed_time": "1 day, 11:39:59", "remaining_time": "6:40:26", "throughput": 332.28, "total_tokens": 42665248} {"current_steps": 33700, "total_steps": 40000, "loss": 0.0568, "lr": 0.017996099933522164, "epoch": 1.646617643466152, "percentage": 84.25, "elapsed_time": "1 day, 11:40:02", "remaining_time": "6:40:04", "throughput": 332.32, "total_tokens": 42671296} {"current_steps": 33705, "total_steps": 40000, "loss": 0.0412, "lr": 0.017968134690916775, "epoch": 1.6468619451298463, "percentage": 84.26, "elapsed_time": "1 day, 11:40:05", "remaining_time": "6:39:42", "throughput": 332.36, "total_tokens": 42677472} {"current_steps": 33710, "total_steps": 40000, "loss": 0.0469, "lr": 0.017940189809284263, "epoch": 1.6471062467935407, "percentage": 84.28, "elapsed_time": "1 day, 11:40:08", "remaining_time": "6:39:19", "throughput": 332.41, "total_tokens": 42684000} {"current_steps": 33715, "total_steps": 40000, "loss": 0.0628, "lr": 0.017912265292934024, "epoch": 1.647350548457235, "percentage": 84.29, "elapsed_time": "1 day, 11:40:11", "remaining_time": "6:38:57", "throughput": 332.45, "total_tokens": 42690304} {"current_steps": 33720, "total_steps": 40000, "loss": 0.0293, "lr": 0.017884361146172423, "epoch": 1.6475948501209294, "percentage": 84.3, "elapsed_time": "1 day, 11:40:14", "remaining_time": "6:38:35", "throughput": 332.49, "total_tokens": 42696544} {"current_steps": 33725, "total_steps": 40000, "loss": 0.068, "lr": 0.01785647737330261, "epoch": 1.6478391517846238, "percentage": 84.31, "elapsed_time": "1 day, 11:40:17", "remaining_time": "6:38:13", "throughput": 332.53, "total_tokens": 42703008} {"current_steps": 33730, "total_steps": 40000, "loss": 0.0557, "lr": 0.017828613978624563, "epoch": 1.648083453448318, "percentage": 84.33, "elapsed_time": "1 day, 11:40:20", "remaining_time": "6:37:51", "throughput": 332.57, "total_tokens": 42709152} {"current_steps": 33735, "total_steps": 40000, "loss": 0.0531, "lr": 0.01780077096643523, "epoch": 1.6483277551120123, "percentage": 84.34, "elapsed_time": "1 day, 11:40:24", "remaining_time": "6:37:29", "throughput": 332.61, "total_tokens": 42715680} {"current_steps": 33740, "total_steps": 40000, "loss": 0.0515, "lr": 0.017772948341028345, "epoch": 1.6485720567757065, "percentage": 84.35, "elapsed_time": "1 day, 11:40:27", "remaining_time": "6:37:07", "throughput": 332.65, "total_tokens": 42721856} {"current_steps": 33745, "total_steps": 40000, "loss": 0.0583, "lr": 0.01774514610669447, "epoch": 1.6488163584394009, "percentage": 84.36, "elapsed_time": "1 day, 11:40:30", "remaining_time": "6:36:45", "throughput": 332.7, "total_tokens": 42728064} {"current_steps": 33750, "total_steps": 40000, "loss": 0.0534, "lr": 0.017717364267721112, "epoch": 1.6490606601030953, "percentage": 84.38, "elapsed_time": "1 day, 11:40:33", "remaining_time": "6:36:23", "throughput": 332.74, "total_tokens": 42734336} {"current_steps": 33755, "total_steps": 40000, "loss": 0.0565, "lr": 0.017689602828392513, "epoch": 1.6493049617667896, "percentage": 84.39, "elapsed_time": "1 day, 11:40:36", "remaining_time": "6:36:01", "throughput": 332.78, "total_tokens": 42740352} {"current_steps": 33760, "total_steps": 40000, "loss": 0.0902, "lr": 0.017661861792989897, "epoch": 1.649549263430484, "percentage": 84.4, "elapsed_time": "1 day, 11:40:39", "remaining_time": "6:35:39", "throughput": 332.82, "total_tokens": 42746496} {"current_steps": 33765, "total_steps": 40000, "loss": 0.0458, "lr": 0.017634141165791272, "epoch": 1.6497935650941784, "percentage": 84.41, "elapsed_time": "1 day, 11:40:42", "remaining_time": "6:35:17", "throughput": 332.86, "total_tokens": 42752992} {"current_steps": 33770, "total_steps": 40000, "loss": 0.0316, "lr": 0.017606440951071455, "epoch": 1.6500378667578728, "percentage": 84.42, "elapsed_time": "1 day, 11:40:45", "remaining_time": "6:34:56", "throughput": 332.9, "total_tokens": 42759232} {"current_steps": 33775, "total_steps": 40000, "loss": 0.074, "lr": 0.017578761153102213, "epoch": 1.650282168421567, "percentage": 84.44, "elapsed_time": "1 day, 11:40:48", "remaining_time": "6:34:34", "throughput": 332.94, "total_tokens": 42765376} {"current_steps": 33780, "total_steps": 40000, "loss": 0.0585, "lr": 0.017551101776152146, "epoch": 1.6505264700852613, "percentage": 84.45, "elapsed_time": "1 day, 11:40:51", "remaining_time": "6:34:12", "throughput": 332.98, "total_tokens": 42771616} {"current_steps": 33785, "total_steps": 40000, "loss": 0.0386, "lr": 0.017523462824486608, "epoch": 1.6507707717489555, "percentage": 84.46, "elapsed_time": "1 day, 11:40:54", "remaining_time": "6:33:50", "throughput": 333.02, "total_tokens": 42777856} {"current_steps": 33790, "total_steps": 40000, "loss": 0.0436, "lr": 0.01749584430236794, "epoch": 1.6510150734126499, "percentage": 84.47, "elapsed_time": "1 day, 11:40:57", "remaining_time": "6:33:28", "throughput": 333.06, "total_tokens": 42784544} {"current_steps": 33795, "total_steps": 40000, "loss": 0.0589, "lr": 0.01746824621405524, "epoch": 1.6512593750763442, "percentage": 84.49, "elapsed_time": "1 day, 11:41:00", "remaining_time": "6:33:06", "throughput": 333.1, "total_tokens": 42790752} {"current_steps": 33800, "total_steps": 40000, "loss": 0.0646, "lr": 0.017440668563804412, "epoch": 1.6515036767400386, "percentage": 84.5, "elapsed_time": "1 day, 11:41:03", "remaining_time": "6:32:44", "throughput": 333.14, "total_tokens": 42796992} {"current_steps": 33800, "total_steps": 40000, "eval_loss": 0.06084033474326134, "epoch": 1.6515036767400386, "percentage": 84.5, "elapsed_time": "1 day, 11:51:37", "remaining_time": "6:34:40", "throughput": 331.51, "total_tokens": 42796992} {"current_steps": 33805, "total_steps": 40000, "loss": 0.07, "lr": 0.017413111355868392, "epoch": 1.651747978403733, "percentage": 84.51, "elapsed_time": "1 day, 11:51:41", "remaining_time": "6:34:18", "throughput": 331.56, "total_tokens": 42804224} {"current_steps": 33810, "total_steps": 40000, "loss": 0.0765, "lr": 0.017385574594496748, "epoch": 1.6519922800674274, "percentage": 84.52, "elapsed_time": "1 day, 11:51:44", "remaining_time": "6:33:56", "throughput": 331.6, "total_tokens": 42810496} {"current_steps": 33815, "total_steps": 40000, "loss": 0.0705, "lr": 0.01735805828393605, "epoch": 1.6522365817311215, "percentage": 84.54, "elapsed_time": "1 day, 11:51:47", "remaining_time": "6:33:34", "throughput": 331.64, "total_tokens": 42816576} {"current_steps": 33820, "total_steps": 40000, "loss": 0.0704, "lr": 0.017330562428429667, "epoch": 1.652480883394816, "percentage": 84.55, "elapsed_time": "1 day, 11:51:50", "remaining_time": "6:33:12", "throughput": 331.67, "total_tokens": 42822560} {"current_steps": 33825, "total_steps": 40000, "loss": 0.0509, "lr": 0.01730308703221776, "epoch": 1.6527251850585103, "percentage": 84.56, "elapsed_time": "1 day, 11:51:53", "remaining_time": "6:32:50", "throughput": 331.71, "total_tokens": 42828864} {"current_steps": 33830, "total_steps": 40000, "loss": 0.0514, "lr": 0.01727563209953744, "epoch": 1.6529694867222045, "percentage": 84.58, "elapsed_time": "1 day, 11:51:56", "remaining_time": "6:32:28", "throughput": 331.76, "total_tokens": 42835360} {"current_steps": 33835, "total_steps": 40000, "loss": 0.0573, "lr": 0.017248197634622535, "epoch": 1.6532137883858988, "percentage": 84.59, "elapsed_time": "1 day, 11:51:59", "remaining_time": "6:32:06", "throughput": 331.8, "total_tokens": 42841888} {"current_steps": 33840, "total_steps": 40000, "loss": 0.0713, "lr": 0.01722078364170383, "epoch": 1.6534580900495932, "percentage": 84.6, "elapsed_time": "1 day, 11:52:02", "remaining_time": "6:31:44", "throughput": 331.84, "total_tokens": 42848320} {"current_steps": 33845, "total_steps": 40000, "loss": 0.0534, "lr": 0.017193390125008905, "epoch": 1.6537023917132876, "percentage": 84.61, "elapsed_time": "1 day, 11:52:05", "remaining_time": "6:31:22", "throughput": 331.88, "total_tokens": 42854848} {"current_steps": 33850, "total_steps": 40000, "loss": 0.0597, "lr": 0.017166017088762153, "epoch": 1.653946693376982, "percentage": 84.62, "elapsed_time": "1 day, 11:52:08", "remaining_time": "6:31:00", "throughput": 331.92, "total_tokens": 42861088} {"current_steps": 33855, "total_steps": 40000, "loss": 0.0442, "lr": 0.017138664537184878, "epoch": 1.6541909950406763, "percentage": 84.64, "elapsed_time": "1 day, 11:52:11", "remaining_time": "6:30:38", "throughput": 331.96, "total_tokens": 42867136} {"current_steps": 33860, "total_steps": 40000, "loss": 0.0468, "lr": 0.017111332474495172, "epoch": 1.6544352967043705, "percentage": 84.65, "elapsed_time": "1 day, 11:52:15", "remaining_time": "6:30:16", "throughput": 332.01, "total_tokens": 42873504} {"current_steps": 33865, "total_steps": 40000, "loss": 0.0516, "lr": 0.017084020904907998, "epoch": 1.6546795983680649, "percentage": 84.66, "elapsed_time": "1 day, 11:52:18", "remaining_time": "6:29:54", "throughput": 332.05, "total_tokens": 42879712} {"current_steps": 33870, "total_steps": 40000, "loss": 0.0622, "lr": 0.017056729832635103, "epoch": 1.6549239000317593, "percentage": 84.67, "elapsed_time": "1 day, 11:52:21", "remaining_time": "6:29:32", "throughput": 332.08, "total_tokens": 42885824} {"current_steps": 33875, "total_steps": 40000, "loss": 0.0493, "lr": 0.017029459261885153, "epoch": 1.6551682016954534, "percentage": 84.69, "elapsed_time": "1 day, 11:52:24", "remaining_time": "6:29:10", "throughput": 332.12, "total_tokens": 42891968} {"current_steps": 33880, "total_steps": 40000, "loss": 0.0691, "lr": 0.01700220919686359, "epoch": 1.6554125033591478, "percentage": 84.7, "elapsed_time": "1 day, 11:52:27", "remaining_time": "6:28:48", "throughput": 332.16, "total_tokens": 42898144} {"current_steps": 33885, "total_steps": 40000, "loss": 0.0615, "lr": 0.016974979641772723, "epoch": 1.6556568050228422, "percentage": 84.71, "elapsed_time": "1 day, 11:52:30", "remaining_time": "6:28:26", "throughput": 332.2, "total_tokens": 42904320} {"current_steps": 33890, "total_steps": 40000, "loss": 0.0681, "lr": 0.01694777060081169, "epoch": 1.6559011066865366, "percentage": 84.72, "elapsed_time": "1 day, 11:52:33", "remaining_time": "6:28:04", "throughput": 332.25, "total_tokens": 42910560} {"current_steps": 33895, "total_steps": 40000, "loss": 0.0977, "lr": 0.016920582078176444, "epoch": 1.656145408350231, "percentage": 84.74, "elapsed_time": "1 day, 11:52:36", "remaining_time": "6:27:42", "throughput": 332.28, "total_tokens": 42916576} {"current_steps": 33900, "total_steps": 40000, "loss": 0.0391, "lr": 0.016893414078059863, "epoch": 1.6563897100139253, "percentage": 84.75, "elapsed_time": "1 day, 11:52:39", "remaining_time": "6:27:21", "throughput": 332.32, "total_tokens": 42922848} {"current_steps": 33905, "total_steps": 40000, "loss": 0.0354, "lr": 0.016866266604651535, "epoch": 1.6566340116776195, "percentage": 84.76, "elapsed_time": "1 day, 11:52:42", "remaining_time": "6:26:59", "throughput": 332.37, "total_tokens": 42929248} {"current_steps": 33910, "total_steps": 40000, "loss": 0.0511, "lr": 0.016839139662137976, "epoch": 1.6568783133413139, "percentage": 84.78, "elapsed_time": "1 day, 11:52:45", "remaining_time": "6:26:37", "throughput": 332.41, "total_tokens": 42935776} {"current_steps": 33915, "total_steps": 40000, "loss": 0.0423, "lr": 0.01681203325470245, "epoch": 1.6571226150050082, "percentage": 84.79, "elapsed_time": "1 day, 11:52:48", "remaining_time": "6:26:15", "throughput": 332.45, "total_tokens": 42942016} {"current_steps": 33920, "total_steps": 40000, "loss": 0.0623, "lr": 0.016784947386525157, "epoch": 1.6573669166687024, "percentage": 84.8, "elapsed_time": "1 day, 11:52:51", "remaining_time": "6:25:53", "throughput": 332.49, "total_tokens": 42948512} {"current_steps": 33925, "total_steps": 40000, "loss": 0.0373, "lr": 0.01675788206178308, "epoch": 1.6576112183323968, "percentage": 84.81, "elapsed_time": "1 day, 11:52:54", "remaining_time": "6:25:31", "throughput": 332.53, "total_tokens": 42954880} {"current_steps": 33930, "total_steps": 40000, "loss": 0.0419, "lr": 0.016730837284649986, "epoch": 1.6578555199960912, "percentage": 84.82, "elapsed_time": "1 day, 11:52:57", "remaining_time": "6:25:09", "throughput": 332.57, "total_tokens": 42960992} {"current_steps": 33935, "total_steps": 40000, "loss": 0.0789, "lr": 0.016703813059296583, "epoch": 1.6580998216597855, "percentage": 84.84, "elapsed_time": "1 day, 11:53:00", "remaining_time": "6:24:47", "throughput": 332.61, "total_tokens": 42966912} {"current_steps": 33940, "total_steps": 40000, "loss": 0.0349, "lr": 0.016676809389890294, "epoch": 1.65834412332348, "percentage": 84.85, "elapsed_time": "1 day, 11:53:03", "remaining_time": "6:24:25", "throughput": 332.65, "total_tokens": 42972960} {"current_steps": 33945, "total_steps": 40000, "loss": 0.0515, "lr": 0.016649826280595435, "epoch": 1.6585884249871743, "percentage": 84.86, "elapsed_time": "1 day, 11:53:06", "remaining_time": "6:24:03", "throughput": 332.69, "total_tokens": 42979264} {"current_steps": 33950, "total_steps": 40000, "loss": 0.0648, "lr": 0.016622863735573163, "epoch": 1.6588327266508684, "percentage": 84.88, "elapsed_time": "1 day, 11:53:09", "remaining_time": "6:23:42", "throughput": 332.73, "total_tokens": 42985376} {"current_steps": 33955, "total_steps": 40000, "loss": 0.0373, "lr": 0.016595921758981395, "epoch": 1.6590770283145628, "percentage": 84.89, "elapsed_time": "1 day, 11:53:13", "remaining_time": "6:23:20", "throughput": 332.77, "total_tokens": 42992128} {"current_steps": 33960, "total_steps": 40000, "loss": 0.0585, "lr": 0.01656900035497495, "epoch": 1.659321329978257, "percentage": 84.9, "elapsed_time": "1 day, 11:53:16", "remaining_time": "6:22:58", "throughput": 332.82, "total_tokens": 42999232} {"current_steps": 33965, "total_steps": 40000, "loss": 0.0536, "lr": 0.016542099527705485, "epoch": 1.6595656316419514, "percentage": 84.91, "elapsed_time": "1 day, 11:53:19", "remaining_time": "6:22:36", "throughput": 332.86, "total_tokens": 43005632} {"current_steps": 33970, "total_steps": 40000, "loss": 0.0601, "lr": 0.01651521928132138, "epoch": 1.6598099333056457, "percentage": 84.92, "elapsed_time": "1 day, 11:53:22", "remaining_time": "6:22:14", "throughput": 332.9, "total_tokens": 43011968} {"current_steps": 33975, "total_steps": 40000, "loss": 0.0695, "lr": 0.01648835961996794, "epoch": 1.6600542349693401, "percentage": 84.94, "elapsed_time": "1 day, 11:53:25", "remaining_time": "6:21:52", "throughput": 332.94, "total_tokens": 43018048} {"current_steps": 33980, "total_steps": 40000, "loss": 0.038, "lr": 0.016461520547787285, "epoch": 1.6602985366330345, "percentage": 84.95, "elapsed_time": "1 day, 11:53:28", "remaining_time": "6:21:30", "throughput": 332.98, "total_tokens": 43024480} {"current_steps": 33985, "total_steps": 40000, "loss": 0.0428, "lr": 0.016434702068918266, "epoch": 1.6605428382967289, "percentage": 84.96, "elapsed_time": "1 day, 11:53:31", "remaining_time": "6:21:09", "throughput": 333.03, "total_tokens": 43030784} {"current_steps": 33990, "total_steps": 40000, "loss": 0.0687, "lr": 0.01640790418749673, "epoch": 1.6607871399604233, "percentage": 84.97, "elapsed_time": "1 day, 11:53:34", "remaining_time": "6:20:47", "throughput": 333.07, "total_tokens": 43036928} {"current_steps": 33995, "total_steps": 40000, "loss": 0.0584, "lr": 0.016381126907655134, "epoch": 1.6610314416241174, "percentage": 84.99, "elapsed_time": "1 day, 11:53:37", "remaining_time": "6:20:25", "throughput": 333.11, "total_tokens": 43043488} {"current_steps": 34000, "total_steps": 40000, "loss": 0.0453, "lr": 0.016354370233522948, "epoch": 1.6612757432878118, "percentage": 85.0, "elapsed_time": "1 day, 11:53:40", "remaining_time": "6:20:03", "throughput": 333.15, "total_tokens": 43049888} {"current_steps": 34000, "total_steps": 40000, "eval_loss": 0.06115463003516197, "epoch": 1.6612757432878118, "percentage": 85.0, "elapsed_time": "1 day, 12:04:14", "remaining_time": "6:21:55", "throughput": 331.52, "total_tokens": 43049888} {"current_steps": 34005, "total_steps": 40000, "loss": 0.0647, "lr": 0.016327634169226394, "epoch": 1.661520044951506, "percentage": 85.01, "elapsed_time": "1 day, 12:04:19", "remaining_time": "6:21:33", "throughput": 331.56, "total_tokens": 43056416} {"current_steps": 34010, "total_steps": 40000, "loss": 0.0566, "lr": 0.016300918718888485, "epoch": 1.6617643466152003, "percentage": 85.02, "elapsed_time": "1 day, 12:04:22", "remaining_time": "6:21:11", "throughput": 331.6, "total_tokens": 43062592} {"current_steps": 34015, "total_steps": 40000, "loss": 0.0544, "lr": 0.016274223886629052, "epoch": 1.6620086482788947, "percentage": 85.04, "elapsed_time": "1 day, 12:04:25", "remaining_time": "6:20:50", "throughput": 331.64, "total_tokens": 43068896} {"current_steps": 34020, "total_steps": 40000, "loss": 0.0381, "lr": 0.01624754967656482, "epoch": 1.662252949942589, "percentage": 85.05, "elapsed_time": "1 day, 12:04:28", "remaining_time": "6:20:28", "throughput": 331.68, "total_tokens": 43075264} {"current_steps": 34025, "total_steps": 40000, "loss": 0.0672, "lr": 0.016220896092809235, "epoch": 1.6624972516062835, "percentage": 85.06, "elapsed_time": "1 day, 12:04:31", "remaining_time": "6:20:06", "throughput": 331.72, "total_tokens": 43081504} {"current_steps": 34030, "total_steps": 40000, "loss": 0.0501, "lr": 0.01619426313947267, "epoch": 1.6627415532699779, "percentage": 85.08, "elapsed_time": "1 day, 12:04:34", "remaining_time": "6:19:44", "throughput": 331.77, "total_tokens": 43088192} {"current_steps": 34035, "total_steps": 40000, "loss": 0.0643, "lr": 0.016167650820662228, "epoch": 1.6629858549336722, "percentage": 85.09, "elapsed_time": "1 day, 12:04:37", "remaining_time": "6:19:22", "throughput": 331.81, "total_tokens": 43094400} {"current_steps": 34040, "total_steps": 40000, "loss": 0.0256, "lr": 0.016141059140481855, "epoch": 1.6632301565973664, "percentage": 85.1, "elapsed_time": "1 day, 12:04:40", "remaining_time": "6:19:00", "throughput": 331.85, "total_tokens": 43100832} {"current_steps": 34045, "total_steps": 40000, "loss": 0.0515, "lr": 0.016114488103032374, "epoch": 1.6634744582610608, "percentage": 85.11, "elapsed_time": "1 day, 12:04:43", "remaining_time": "6:18:38", "throughput": 331.89, "total_tokens": 43106880} {"current_steps": 34050, "total_steps": 40000, "loss": 0.0546, "lr": 0.016087937712411293, "epoch": 1.663718759924755, "percentage": 85.12, "elapsed_time": "1 day, 12:04:46", "remaining_time": "6:18:16", "throughput": 331.93, "total_tokens": 43112960} {"current_steps": 34055, "total_steps": 40000, "loss": 0.0486, "lr": 0.01606140797271308, "epoch": 1.6639630615884493, "percentage": 85.14, "elapsed_time": "1 day, 12:04:49", "remaining_time": "6:17:54", "throughput": 331.97, "total_tokens": 43119424} {"current_steps": 34060, "total_steps": 40000, "loss": 0.0553, "lr": 0.01603489888802897, "epoch": 1.6642073632521437, "percentage": 85.15, "elapsed_time": "1 day, 12:04:53", "remaining_time": "6:17:33", "throughput": 332.01, "total_tokens": 43126400} {"current_steps": 34065, "total_steps": 40000, "loss": 0.0414, "lr": 0.016008410462446918, "epoch": 1.664451664915838, "percentage": 85.16, "elapsed_time": "1 day, 12:04:56", "remaining_time": "6:17:11", "throughput": 332.06, "total_tokens": 43132960} {"current_steps": 34070, "total_steps": 40000, "loss": 0.0601, "lr": 0.01598194270005185, "epoch": 1.6646959665795324, "percentage": 85.17, "elapsed_time": "1 day, 12:04:59", "remaining_time": "6:16:49", "throughput": 332.1, "total_tokens": 43139328} {"current_steps": 34075, "total_steps": 40000, "loss": 0.0399, "lr": 0.015955495604925356, "epoch": 1.6649402682432268, "percentage": 85.19, "elapsed_time": "1 day, 12:05:02", "remaining_time": "6:16:27", "throughput": 332.14, "total_tokens": 43145440} {"current_steps": 34080, "total_steps": 40000, "loss": 0.0597, "lr": 0.01592906918114598, "epoch": 1.6651845699069212, "percentage": 85.2, "elapsed_time": "1 day, 12:05:05", "remaining_time": "6:16:05", "throughput": 332.18, "total_tokens": 43151520} {"current_steps": 34085, "total_steps": 40000, "loss": 0.064, "lr": 0.015902663432788965, "epoch": 1.6654288715706154, "percentage": 85.21, "elapsed_time": "1 day, 12:05:08", "remaining_time": "6:15:43", "throughput": 332.22, "total_tokens": 43157728} {"current_steps": 34090, "total_steps": 40000, "loss": 0.0667, "lr": 0.01587627836392643, "epoch": 1.6656731732343097, "percentage": 85.22, "elapsed_time": "1 day, 12:05:11", "remaining_time": "6:15:22", "throughput": 332.26, "total_tokens": 43164064} {"current_steps": 34095, "total_steps": 40000, "loss": 0.0448, "lr": 0.01584991397862726, "epoch": 1.665917474898004, "percentage": 85.24, "elapsed_time": "1 day, 12:05:14", "remaining_time": "6:15:00", "throughput": 332.3, "total_tokens": 43170528} {"current_steps": 34100, "total_steps": 40000, "loss": 0.0626, "lr": 0.015823570280957214, "epoch": 1.6661617765616983, "percentage": 85.25, "elapsed_time": "1 day, 12:05:17", "remaining_time": "6:14:38", "throughput": 332.34, "total_tokens": 43176992} {"current_steps": 34105, "total_steps": 40000, "loss": 0.0525, "lr": 0.015797247274978766, "epoch": 1.6664060782253927, "percentage": 85.26, "elapsed_time": "1 day, 12:05:20", "remaining_time": "6:14:16", "throughput": 332.38, "total_tokens": 43183136} {"current_steps": 34110, "total_steps": 40000, "loss": 0.0496, "lr": 0.015770944964751326, "epoch": 1.666650379889087, "percentage": 85.28, "elapsed_time": "1 day, 12:05:23", "remaining_time": "6:13:54", "throughput": 332.42, "total_tokens": 43189728} {"current_steps": 34115, "total_steps": 40000, "loss": 0.0431, "lr": 0.015744663354330956, "epoch": 1.6668946815527814, "percentage": 85.29, "elapsed_time": "1 day, 12:05:26", "remaining_time": "6:13:32", "throughput": 332.46, "total_tokens": 43195840} {"current_steps": 34120, "total_steps": 40000, "loss": 0.0591, "lr": 0.015718402447770664, "epoch": 1.6671389832164758, "percentage": 85.3, "elapsed_time": "1 day, 12:05:29", "remaining_time": "6:13:11", "throughput": 332.51, "total_tokens": 43202560} {"current_steps": 34125, "total_steps": 40000, "loss": 0.0372, "lr": 0.015692162249120224, "epoch": 1.6673832848801702, "percentage": 85.31, "elapsed_time": "1 day, 12:05:33", "remaining_time": "6:12:49", "throughput": 332.55, "total_tokens": 43208960} {"current_steps": 34130, "total_steps": 40000, "loss": 0.0458, "lr": 0.01566594276242615, "epoch": 1.6676275865438643, "percentage": 85.32, "elapsed_time": "1 day, 12:05:36", "remaining_time": "6:12:27", "throughput": 332.59, "total_tokens": 43215168} {"current_steps": 34135, "total_steps": 40000, "loss": 0.0941, "lr": 0.015639743991731857, "epoch": 1.6678718882075587, "percentage": 85.34, "elapsed_time": "1 day, 12:05:39", "remaining_time": "6:12:05", "throughput": 332.63, "total_tokens": 43221216} {"current_steps": 34140, "total_steps": 40000, "loss": 0.0406, "lr": 0.01561356594107755, "epoch": 1.6681161898712529, "percentage": 85.35, "elapsed_time": "1 day, 12:05:41", "remaining_time": "6:11:44", "throughput": 332.67, "total_tokens": 43227168} {"current_steps": 34145, "total_steps": 40000, "loss": 0.0756, "lr": 0.015587408614500147, "epoch": 1.6683604915349473, "percentage": 85.36, "elapsed_time": "1 day, 12:05:44", "remaining_time": "6:11:22", "throughput": 332.7, "total_tokens": 43233280} {"current_steps": 34150, "total_steps": 40000, "loss": 0.0558, "lr": 0.015561272016033505, "epoch": 1.6686047931986416, "percentage": 85.38, "elapsed_time": "1 day, 12:05:48", "remaining_time": "6:11:00", "throughput": 332.74, "total_tokens": 43239456} {"current_steps": 34155, "total_steps": 40000, "loss": 0.0362, "lr": 0.015535156149708167, "epoch": 1.668849094862336, "percentage": 85.39, "elapsed_time": "1 day, 12:05:51", "remaining_time": "6:10:38", "throughput": 332.78, "total_tokens": 43245312} {"current_steps": 34160, "total_steps": 40000, "loss": 0.0618, "lr": 0.015509061019551528, "epoch": 1.6690933965260304, "percentage": 85.4, "elapsed_time": "1 day, 12:05:54", "remaining_time": "6:10:16", "throughput": 332.82, "total_tokens": 43251584} {"current_steps": 34165, "total_steps": 40000, "loss": 0.0504, "lr": 0.015482986629587818, "epoch": 1.6693376981897248, "percentage": 85.41, "elapsed_time": "1 day, 12:05:57", "remaining_time": "6:09:55", "throughput": 332.86, "total_tokens": 43258112} {"current_steps": 34170, "total_steps": 40000, "loss": 0.0344, "lr": 0.01545693298383799, "epoch": 1.6695819998534192, "percentage": 85.42, "elapsed_time": "1 day, 12:06:00", "remaining_time": "6:09:33", "throughput": 332.91, "total_tokens": 43264512} {"current_steps": 34175, "total_steps": 40000, "loss": 0.041, "lr": 0.015430900086319858, "epoch": 1.6698263015171133, "percentage": 85.44, "elapsed_time": "1 day, 12:06:03", "remaining_time": "6:09:11", "throughput": 332.95, "total_tokens": 43270944} {"current_steps": 34180, "total_steps": 40000, "loss": 0.066, "lr": 0.015404887941048084, "epoch": 1.6700706031808077, "percentage": 85.45, "elapsed_time": "1 day, 12:06:06", "remaining_time": "6:08:50", "throughput": 332.99, "total_tokens": 43277760} {"current_steps": 34185, "total_steps": 40000, "loss": 0.0561, "lr": 0.01537889655203397, "epoch": 1.6703149048445018, "percentage": 85.46, "elapsed_time": "1 day, 12:06:09", "remaining_time": "6:08:28", "throughput": 333.03, "total_tokens": 43284064} {"current_steps": 34190, "total_steps": 40000, "loss": 0.0839, "lr": 0.015352925923285798, "epoch": 1.6705592065081962, "percentage": 85.47, "elapsed_time": "1 day, 12:06:12", "remaining_time": "6:08:06", "throughput": 333.07, "total_tokens": 43290528} {"current_steps": 34195, "total_steps": 40000, "loss": 0.103, "lr": 0.015326976058808511, "epoch": 1.6708035081718906, "percentage": 85.49, "elapsed_time": "1 day, 12:06:15", "remaining_time": "6:07:44", "throughput": 333.11, "total_tokens": 43296704} {"current_steps": 34200, "total_steps": 40000, "loss": 0.0443, "lr": 0.015301046962603908, "epoch": 1.671047809835585, "percentage": 85.5, "elapsed_time": "1 day, 12:06:18", "remaining_time": "6:07:23", "throughput": 333.16, "total_tokens": 43303328} {"current_steps": 34200, "total_steps": 40000, "eval_loss": 0.060991331934928894, "epoch": 1.671047809835585, "percentage": 85.5, "elapsed_time": "1 day, 12:16:52", "remaining_time": "6:09:10", "throughput": 331.54, "total_tokens": 43303328} {"current_steps": 34205, "total_steps": 40000, "loss": 0.0574, "lr": 0.015275138638670626, "epoch": 1.6712921114992794, "percentage": 85.51, "elapsed_time": "1 day, 12:16:56", "remaining_time": "6:08:49", "throughput": 331.58, "total_tokens": 43309952} {"current_steps": 34210, "total_steps": 40000, "loss": 0.0534, "lr": 0.015249251091004001, "epoch": 1.6715364131629737, "percentage": 85.52, "elapsed_time": "1 day, 12:16:59", "remaining_time": "6:08:27", "throughput": 331.62, "total_tokens": 43316416} {"current_steps": 34215, "total_steps": 40000, "loss": 0.0481, "lr": 0.01522338432359624, "epoch": 1.6717807148266681, "percentage": 85.54, "elapsed_time": "1 day, 12:17:02", "remaining_time": "6:08:05", "throughput": 331.66, "total_tokens": 43322784} {"current_steps": 34220, "total_steps": 40000, "loss": 0.0465, "lr": 0.01519753834043635, "epoch": 1.6720250164903623, "percentage": 85.55, "elapsed_time": "1 day, 12:17:06", "remaining_time": "6:07:43", "throughput": 331.7, "total_tokens": 43329280} {"current_steps": 34225, "total_steps": 40000, "loss": 0.0303, "lr": 0.015171713145510095, "epoch": 1.6722693181540567, "percentage": 85.56, "elapsed_time": "1 day, 12:17:09", "remaining_time": "6:07:21", "throughput": 331.74, "total_tokens": 43335360} {"current_steps": 34230, "total_steps": 40000, "loss": 0.0725, "lr": 0.01514590874279999, "epoch": 1.6725136198177508, "percentage": 85.58, "elapsed_time": "1 day, 12:17:12", "remaining_time": "6:07:00", "throughput": 331.79, "total_tokens": 43342016} {"current_steps": 34235, "total_steps": 40000, "loss": 0.0476, "lr": 0.015120125136285467, "epoch": 1.6727579214814452, "percentage": 85.59, "elapsed_time": "1 day, 12:17:15", "remaining_time": "6:06:38", "throughput": 331.83, "total_tokens": 43348224} {"current_steps": 34240, "total_steps": 40000, "loss": 0.0499, "lr": 0.015094362329942629, "epoch": 1.6730022231451396, "percentage": 85.6, "elapsed_time": "1 day, 12:17:18", "remaining_time": "6:06:16", "throughput": 331.87, "total_tokens": 43354432} {"current_steps": 34245, "total_steps": 40000, "loss": 0.0613, "lr": 0.01506862032774448, "epoch": 1.673246524808834, "percentage": 85.61, "elapsed_time": "1 day, 12:17:21", "remaining_time": "6:05:54", "throughput": 331.91, "total_tokens": 43360768} {"current_steps": 34250, "total_steps": 40000, "loss": 0.0473, "lr": 0.015042899133660697, "epoch": 1.6734908264725283, "percentage": 85.62, "elapsed_time": "1 day, 12:17:24", "remaining_time": "6:05:32", "throughput": 331.95, "total_tokens": 43367168} {"current_steps": 34255, "total_steps": 40000, "loss": 0.0729, "lr": 0.01501719875165789, "epoch": 1.6737351281362227, "percentage": 85.64, "elapsed_time": "1 day, 12:17:27", "remaining_time": "6:05:11", "throughput": 331.99, "total_tokens": 43373376} {"current_steps": 34260, "total_steps": 40000, "loss": 0.0323, "lr": 0.014991519185699286, "epoch": 1.673979429799917, "percentage": 85.65, "elapsed_time": "1 day, 12:17:30", "remaining_time": "6:04:49", "throughput": 332.03, "total_tokens": 43380224} {"current_steps": 34265, "total_steps": 40000, "loss": 0.0408, "lr": 0.014965860439745054, "epoch": 1.6742237314636113, "percentage": 85.66, "elapsed_time": "1 day, 12:17:33", "remaining_time": "6:04:27", "throughput": 332.07, "total_tokens": 43386176} {"current_steps": 34270, "total_steps": 40000, "loss": 0.0562, "lr": 0.01494022251775211, "epoch": 1.6744680331273056, "percentage": 85.67, "elapsed_time": "1 day, 12:17:36", "remaining_time": "6:04:06", "throughput": 332.11, "total_tokens": 43392608} {"current_steps": 34275, "total_steps": 40000, "loss": 0.0513, "lr": 0.014914605423674109, "epoch": 1.6747123347909998, "percentage": 85.69, "elapsed_time": "1 day, 12:17:39", "remaining_time": "6:03:44", "throughput": 332.15, "total_tokens": 43399040} {"current_steps": 34280, "total_steps": 40000, "loss": 0.0524, "lr": 0.014889009161461525, "epoch": 1.6749566364546942, "percentage": 85.7, "elapsed_time": "1 day, 12:17:42", "remaining_time": "6:03:22", "throughput": 332.19, "total_tokens": 43405472} {"current_steps": 34285, "total_steps": 40000, "loss": 0.0767, "lr": 0.014863433735061665, "epoch": 1.6752009381183885, "percentage": 85.71, "elapsed_time": "1 day, 12:17:45", "remaining_time": "6:03:00", "throughput": 332.23, "total_tokens": 43411680} {"current_steps": 34290, "total_steps": 40000, "loss": 0.0457, "lr": 0.014837879148418541, "epoch": 1.675445239782083, "percentage": 85.72, "elapsed_time": "1 day, 12:17:48", "remaining_time": "6:02:39", "throughput": 332.28, "total_tokens": 43418240} {"current_steps": 34295, "total_steps": 40000, "loss": 0.0471, "lr": 0.01481234540547302, "epoch": 1.6756895414457773, "percentage": 85.74, "elapsed_time": "1 day, 12:17:52", "remaining_time": "6:02:17", "throughput": 332.32, "total_tokens": 43424672} {"current_steps": 34300, "total_steps": 40000, "loss": 0.0644, "lr": 0.014786832510162717, "epoch": 1.6759338431094717, "percentage": 85.75, "elapsed_time": "1 day, 12:17:55", "remaining_time": "6:01:55", "throughput": 332.36, "total_tokens": 43431200} {"current_steps": 34305, "total_steps": 40000, "loss": 0.0734, "lr": 0.014761340466422017, "epoch": 1.676178144773166, "percentage": 85.76, "elapsed_time": "1 day, 12:17:58", "remaining_time": "6:01:33", "throughput": 332.4, "total_tokens": 43437248} {"current_steps": 34310, "total_steps": 40000, "loss": 0.0531, "lr": 0.014735869278182144, "epoch": 1.6764224464368602, "percentage": 85.78, "elapsed_time": "1 day, 12:18:01", "remaining_time": "6:01:12", "throughput": 332.44, "total_tokens": 43443424} {"current_steps": 34315, "total_steps": 40000, "loss": 0.0499, "lr": 0.014710418949371057, "epoch": 1.6766667481005546, "percentage": 85.79, "elapsed_time": "1 day, 12:18:04", "remaining_time": "6:00:50", "throughput": 332.48, "total_tokens": 43449984} {"current_steps": 34320, "total_steps": 40000, "loss": 0.0517, "lr": 0.014684989483913495, "epoch": 1.6769110497642488, "percentage": 85.8, "elapsed_time": "1 day, 12:18:07", "remaining_time": "6:00:28", "throughput": 332.52, "total_tokens": 43456736} {"current_steps": 34325, "total_steps": 40000, "loss": 0.0526, "lr": 0.014659580885731077, "epoch": 1.6771553514279431, "percentage": 85.81, "elapsed_time": "1 day, 12:18:10", "remaining_time": "6:00:07", "throughput": 332.56, "total_tokens": 43463072} {"current_steps": 34330, "total_steps": 40000, "loss": 0.0813, "lr": 0.014634193158742047, "epoch": 1.6773996530916375, "percentage": 85.82, "elapsed_time": "1 day, 12:18:13", "remaining_time": "5:59:45", "throughput": 332.6, "total_tokens": 43469280} {"current_steps": 34335, "total_steps": 40000, "loss": 0.0556, "lr": 0.014608826306861576, "epoch": 1.677643954755332, "percentage": 85.84, "elapsed_time": "1 day, 12:18:16", "remaining_time": "5:59:23", "throughput": 332.65, "total_tokens": 43475936} {"current_steps": 34340, "total_steps": 40000, "loss": 0.0369, "lr": 0.014583480334001486, "epoch": 1.6778882564190263, "percentage": 85.85, "elapsed_time": "1 day, 12:18:19", "remaining_time": "5:59:02", "throughput": 332.69, "total_tokens": 43482176} {"current_steps": 34345, "total_steps": 40000, "loss": 0.038, "lr": 0.014558155244070496, "epoch": 1.6781325580827207, "percentage": 85.86, "elapsed_time": "1 day, 12:18:22", "remaining_time": "5:58:40", "throughput": 332.73, "total_tokens": 43488864} {"current_steps": 34350, "total_steps": 40000, "loss": 0.0702, "lr": 0.014532851040974036, "epoch": 1.678376859746415, "percentage": 85.88, "elapsed_time": "1 day, 12:18:25", "remaining_time": "5:58:18", "throughput": 332.77, "total_tokens": 43494720} {"current_steps": 34355, "total_steps": 40000, "loss": 0.0627, "lr": 0.014507567728614335, "epoch": 1.6786211614101092, "percentage": 85.89, "elapsed_time": "1 day, 12:18:28", "remaining_time": "5:57:57", "throughput": 332.81, "total_tokens": 43500800} {"current_steps": 34360, "total_steps": 40000, "loss": 0.0703, "lr": 0.01448230531089037, "epoch": 1.6788654630738036, "percentage": 85.9, "elapsed_time": "1 day, 12:18:31", "remaining_time": "5:57:35", "throughput": 332.85, "total_tokens": 43506912} {"current_steps": 34365, "total_steps": 40000, "loss": 0.0336, "lr": 0.014457063791697993, "epoch": 1.6791097647374977, "percentage": 85.91, "elapsed_time": "1 day, 12:18:35", "remaining_time": "5:57:14", "throughput": 332.89, "total_tokens": 43513696} {"current_steps": 34370, "total_steps": 40000, "loss": 0.0527, "lr": 0.01443184317492971, "epoch": 1.6793540664011921, "percentage": 85.92, "elapsed_time": "1 day, 12:18:38", "remaining_time": "5:56:52", "throughput": 332.93, "total_tokens": 43520448} {"current_steps": 34375, "total_steps": 40000, "loss": 0.0534, "lr": 0.014406643464474822, "epoch": 1.6795983680648865, "percentage": 85.94, "elapsed_time": "1 day, 12:18:41", "remaining_time": "5:56:30", "throughput": 332.97, "total_tokens": 43526400} {"current_steps": 34380, "total_steps": 40000, "loss": 0.0935, "lr": 0.014381464664219539, "epoch": 1.6798426697285809, "percentage": 85.95, "elapsed_time": "1 day, 12:18:44", "remaining_time": "5:56:09", "throughput": 333.01, "total_tokens": 43532800} {"current_steps": 34385, "total_steps": 40000, "loss": 0.079, "lr": 0.014356306778046656, "epoch": 1.6800869713922753, "percentage": 85.96, "elapsed_time": "1 day, 12:18:47", "remaining_time": "5:55:47", "throughput": 333.05, "total_tokens": 43538656} {"current_steps": 34390, "total_steps": 40000, "loss": 0.0644, "lr": 0.014331169809835885, "epoch": 1.6803312730559696, "percentage": 85.97, "elapsed_time": "1 day, 12:18:50", "remaining_time": "5:55:25", "throughput": 333.09, "total_tokens": 43544736} {"current_steps": 34395, "total_steps": 40000, "loss": 0.0403, "lr": 0.014306053763463644, "epoch": 1.6805755747196638, "percentage": 85.99, "elapsed_time": "1 day, 12:18:53", "remaining_time": "5:55:04", "throughput": 333.13, "total_tokens": 43550720} {"current_steps": 34400, "total_steps": 40000, "loss": 0.0574, "lr": 0.014280958642803147, "epoch": 1.6808198763833582, "percentage": 86.0, "elapsed_time": "1 day, 12:18:56", "remaining_time": "5:54:42", "throughput": 333.16, "total_tokens": 43556672} {"current_steps": 34400, "total_steps": 40000, "eval_loss": 0.06061418354511261, "epoch": 1.6808198763833582, "percentage": 86.0, "elapsed_time": "1 day, 12:29:30", "remaining_time": "5:56:25", "throughput": 331.56, "total_tokens": 43556672} {"current_steps": 34405, "total_steps": 40000, "loss": 0.0845, "lr": 0.014255884451724404, "epoch": 1.6810641780470525, "percentage": 86.01, "elapsed_time": "1 day, 12:29:34", "remaining_time": "5:56:04", "throughput": 331.59, "total_tokens": 43562880} {"current_steps": 34410, "total_steps": 40000, "loss": 0.0342, "lr": 0.014230831194094101, "epoch": 1.6813084797107467, "percentage": 86.02, "elapsed_time": "1 day, 12:29:37", "remaining_time": "5:55:42", "throughput": 331.63, "total_tokens": 43569408} {"current_steps": 34415, "total_steps": 40000, "loss": 0.0834, "lr": 0.014205798873775865, "epoch": 1.681552781374441, "percentage": 86.04, "elapsed_time": "1 day, 12:29:40", "remaining_time": "5:55:20", "throughput": 331.67, "total_tokens": 43575328} {"current_steps": 34420, "total_steps": 40000, "loss": 0.0709, "lr": 0.014180787494629893, "epoch": 1.6817970830381355, "percentage": 86.05, "elapsed_time": "1 day, 12:29:43", "remaining_time": "5:54:59", "throughput": 331.71, "total_tokens": 43581792} {"current_steps": 34425, "total_steps": 40000, "loss": 0.0848, "lr": 0.014155797060513314, "epoch": 1.6820413847018298, "percentage": 86.06, "elapsed_time": "1 day, 12:29:46", "remaining_time": "5:54:37", "throughput": 331.76, "total_tokens": 43588256} {"current_steps": 34430, "total_steps": 40000, "loss": 0.0562, "lr": 0.014130827575279963, "epoch": 1.6822856863655242, "percentage": 86.08, "elapsed_time": "1 day, 12:29:49", "remaining_time": "5:54:15", "throughput": 331.8, "total_tokens": 43594592} {"current_steps": 34435, "total_steps": 40000, "loss": 0.0585, "lr": 0.014105879042780427, "epoch": 1.6825299880292186, "percentage": 86.09, "elapsed_time": "1 day, 12:29:52", "remaining_time": "5:53:54", "throughput": 331.84, "total_tokens": 43600896} {"current_steps": 34440, "total_steps": 40000, "loss": 0.0623, "lr": 0.014080951466862113, "epoch": 1.6827742896929128, "percentage": 86.1, "elapsed_time": "1 day, 12:29:56", "remaining_time": "5:53:32", "throughput": 331.88, "total_tokens": 43607136} {"current_steps": 34445, "total_steps": 40000, "loss": 0.0681, "lr": 0.014056044851369126, "epoch": 1.6830185913566071, "percentage": 86.11, "elapsed_time": "1 day, 12:29:59", "remaining_time": "5:53:10", "throughput": 331.91, "total_tokens": 43613312} {"current_steps": 34450, "total_steps": 40000, "loss": 0.09, "lr": 0.014031159200142428, "epoch": 1.6832628930203015, "percentage": 86.12, "elapsed_time": "1 day, 12:30:02", "remaining_time": "5:52:49", "throughput": 331.95, "total_tokens": 43619424} {"current_steps": 34455, "total_steps": 40000, "loss": 0.0327, "lr": 0.014006294517019667, "epoch": 1.6835071946839957, "percentage": 86.14, "elapsed_time": "1 day, 12:30:05", "remaining_time": "5:52:27", "throughput": 332.0, "total_tokens": 43626272} {"current_steps": 34460, "total_steps": 40000, "loss": 0.0645, "lr": 0.013981450805835276, "epoch": 1.68375149634769, "percentage": 86.15, "elapsed_time": "1 day, 12:30:08", "remaining_time": "5:52:06", "throughput": 332.04, "total_tokens": 43633024} {"current_steps": 34465, "total_steps": 40000, "loss": 0.0396, "lr": 0.01395662807042049, "epoch": 1.6839957980113844, "percentage": 86.16, "elapsed_time": "1 day, 12:30:11", "remaining_time": "5:51:44", "throughput": 332.08, "total_tokens": 43639392} {"current_steps": 34470, "total_steps": 40000, "loss": 0.0501, "lr": 0.013931826314603296, "epoch": 1.6842400996750788, "percentage": 86.17, "elapsed_time": "1 day, 12:30:14", "remaining_time": "5:51:22", "throughput": 332.12, "total_tokens": 43645600} {"current_steps": 34475, "total_steps": 40000, "loss": 0.0626, "lr": 0.013907045542208401, "epoch": 1.6844844013387732, "percentage": 86.19, "elapsed_time": "1 day, 12:30:17", "remaining_time": "5:51:01", "throughput": 332.16, "total_tokens": 43651936} {"current_steps": 34480, "total_steps": 40000, "loss": 0.0514, "lr": 0.013882285757057333, "epoch": 1.6847287030024676, "percentage": 86.2, "elapsed_time": "1 day, 12:30:20", "remaining_time": "5:50:39", "throughput": 332.2, "total_tokens": 43657984} {"current_steps": 34485, "total_steps": 40000, "loss": 0.062, "lr": 0.013857546962968403, "epoch": 1.6849730046661617, "percentage": 86.21, "elapsed_time": "1 day, 12:30:23", "remaining_time": "5:50:17", "throughput": 332.24, "total_tokens": 43664224} {"current_steps": 34490, "total_steps": 40000, "loss": 0.0662, "lr": 0.013832829163756577, "epoch": 1.6852173063298561, "percentage": 86.22, "elapsed_time": "1 day, 12:30:26", "remaining_time": "5:49:56", "throughput": 332.28, "total_tokens": 43670624} {"current_steps": 34495, "total_steps": 40000, "loss": 0.0497, "lr": 0.013808132363233689, "epoch": 1.6854616079935503, "percentage": 86.24, "elapsed_time": "1 day, 12:30:29", "remaining_time": "5:49:34", "throughput": 332.32, "total_tokens": 43676640} {"current_steps": 34500, "total_steps": 40000, "loss": 0.0555, "lr": 0.013783456565208256, "epoch": 1.6857059096572446, "percentage": 86.25, "elapsed_time": "1 day, 12:30:32", "remaining_time": "5:49:13", "throughput": 332.36, "total_tokens": 43683200} {"current_steps": 34505, "total_steps": 40000, "loss": 0.0955, "lr": 0.01375880177348564, "epoch": 1.685950211320939, "percentage": 86.26, "elapsed_time": "1 day, 12:30:36", "remaining_time": "5:48:51", "throughput": 332.4, "total_tokens": 43689696} {"current_steps": 34510, "total_steps": 40000, "loss": 0.0571, "lr": 0.013734167991867928, "epoch": 1.6861945129846334, "percentage": 86.28, "elapsed_time": "1 day, 12:30:39", "remaining_time": "5:48:29", "throughput": 332.44, "total_tokens": 43696032} {"current_steps": 34515, "total_steps": 40000, "loss": 0.0526, "lr": 0.013709555224153935, "epoch": 1.6864388146483278, "percentage": 86.29, "elapsed_time": "1 day, 12:30:42", "remaining_time": "5:48:08", "throughput": 332.48, "total_tokens": 43702272} {"current_steps": 34520, "total_steps": 40000, "loss": 0.0672, "lr": 0.013684963474139222, "epoch": 1.6866831163120222, "percentage": 86.3, "elapsed_time": "1 day, 12:30:45", "remaining_time": "5:47:46", "throughput": 332.52, "total_tokens": 43708480} {"current_steps": 34525, "total_steps": 40000, "loss": 0.0507, "lr": 0.013660392745616224, "epoch": 1.6869274179757165, "percentage": 86.31, "elapsed_time": "1 day, 12:30:48", "remaining_time": "5:47:25", "throughput": 332.57, "total_tokens": 43715136} {"current_steps": 34530, "total_steps": 40000, "loss": 0.0381, "lr": 0.013635843042373974, "epoch": 1.6871717196394107, "percentage": 86.33, "elapsed_time": "1 day, 12:30:51", "remaining_time": "5:47:03", "throughput": 332.6, "total_tokens": 43720960} {"current_steps": 34535, "total_steps": 40000, "loss": 0.0604, "lr": 0.01361131436819843, "epoch": 1.687416021303105, "percentage": 86.34, "elapsed_time": "1 day, 12:30:54", "remaining_time": "5:46:42", "throughput": 332.64, "total_tokens": 43726752} {"current_steps": 34540, "total_steps": 40000, "loss": 0.0642, "lr": 0.013586806726872147, "epoch": 1.6876603229667992, "percentage": 86.35, "elapsed_time": "1 day, 12:30:57", "remaining_time": "5:46:20", "throughput": 332.68, "total_tokens": 43732576} {"current_steps": 34545, "total_steps": 40000, "loss": 0.0251, "lr": 0.013562320122174537, "epoch": 1.6879046246304936, "percentage": 86.36, "elapsed_time": "1 day, 12:31:00", "remaining_time": "5:45:58", "throughput": 332.71, "total_tokens": 43738816} {"current_steps": 34550, "total_steps": 40000, "loss": 0.0488, "lr": 0.013537854557881762, "epoch": 1.688148926294188, "percentage": 86.38, "elapsed_time": "1 day, 12:31:03", "remaining_time": "5:45:37", "throughput": 332.75, "total_tokens": 43744992} {"current_steps": 34555, "total_steps": 40000, "loss": 0.0735, "lr": 0.013513410037766687, "epoch": 1.6883932279578824, "percentage": 86.39, "elapsed_time": "1 day, 12:31:06", "remaining_time": "5:45:15", "throughput": 332.79, "total_tokens": 43751296} {"current_steps": 34560, "total_steps": 40000, "loss": 0.0701, "lr": 0.013488986565598998, "epoch": 1.6886375296215768, "percentage": 86.4, "elapsed_time": "1 day, 12:31:09", "remaining_time": "5:44:54", "throughput": 332.84, "total_tokens": 43757856} {"current_steps": 34565, "total_steps": 40000, "loss": 0.0469, "lr": 0.013464584145145097, "epoch": 1.6888818312852711, "percentage": 86.41, "elapsed_time": "1 day, 12:31:12", "remaining_time": "5:44:32", "throughput": 332.88, "total_tokens": 43764192} {"current_steps": 34570, "total_steps": 40000, "loss": 0.0732, "lr": 0.013440202780168109, "epoch": 1.6891261329489655, "percentage": 86.42, "elapsed_time": "1 day, 12:31:15", "remaining_time": "5:44:11", "throughput": 332.92, "total_tokens": 43771200} {"current_steps": 34575, "total_steps": 40000, "loss": 0.0591, "lr": 0.01341584247442799, "epoch": 1.6893704346126597, "percentage": 86.44, "elapsed_time": "1 day, 12:31:19", "remaining_time": "5:43:49", "throughput": 332.97, "total_tokens": 43778016} {"current_steps": 34580, "total_steps": 40000, "loss": 0.0799, "lr": 0.013391503231681355, "epoch": 1.689614736276354, "percentage": 86.45, "elapsed_time": "1 day, 12:31:22", "remaining_time": "5:43:28", "throughput": 333.0, "total_tokens": 43783936} {"current_steps": 34585, "total_steps": 40000, "loss": 0.0423, "lr": 0.013367185055681685, "epoch": 1.6898590379400482, "percentage": 86.46, "elapsed_time": "1 day, 12:31:25", "remaining_time": "5:43:06", "throughput": 333.04, "total_tokens": 43790176} {"current_steps": 34590, "total_steps": 40000, "loss": 0.0383, "lr": 0.013342887950179095, "epoch": 1.6901033396037426, "percentage": 86.48, "elapsed_time": "1 day, 12:31:28", "remaining_time": "5:42:45", "throughput": 333.08, "total_tokens": 43796640} {"current_steps": 34595, "total_steps": 40000, "loss": 0.0616, "lr": 0.013318611918920554, "epoch": 1.690347641267437, "percentage": 86.49, "elapsed_time": "1 day, 12:31:31", "remaining_time": "5:42:23", "throughput": 333.12, "total_tokens": 43802784} {"current_steps": 34600, "total_steps": 40000, "loss": 0.052, "lr": 0.01329435696564965, "epoch": 1.6905919429311314, "percentage": 86.5, "elapsed_time": "1 day, 12:31:34", "remaining_time": "5:42:02", "throughput": 333.16, "total_tokens": 43809088} {"current_steps": 34600, "total_steps": 40000, "eval_loss": 0.06073778495192528, "epoch": 1.6905919429311314, "percentage": 86.5, "elapsed_time": "1 day, 12:42:08", "remaining_time": "5:43:41", "throughput": 331.56, "total_tokens": 43809088} {"current_steps": 34605, "total_steps": 40000, "loss": 0.0687, "lr": 0.013270123094106894, "epoch": 1.6908362445948257, "percentage": 86.51, "elapsed_time": "1 day, 12:42:12", "remaining_time": "5:43:19", "throughput": 331.6, "total_tokens": 43815232} {"current_steps": 34610, "total_steps": 40000, "loss": 0.0729, "lr": 0.013245910308029395, "epoch": 1.6910805462585201, "percentage": 86.52, "elapsed_time": "1 day, 12:42:15", "remaining_time": "5:42:58", "throughput": 331.64, "total_tokens": 43821472} {"current_steps": 34615, "total_steps": 40000, "loss": 0.0327, "lr": 0.0132217186111511, "epoch": 1.6913248479222145, "percentage": 86.54, "elapsed_time": "1 day, 12:42:18", "remaining_time": "5:42:36", "throughput": 331.68, "total_tokens": 43827680} {"current_steps": 34620, "total_steps": 40000, "loss": 0.0405, "lr": 0.013197548007202626, "epoch": 1.6915691495859086, "percentage": 86.55, "elapsed_time": "1 day, 12:42:21", "remaining_time": "5:42:15", "throughput": 331.72, "total_tokens": 43834080} {"current_steps": 34625, "total_steps": 40000, "loss": 0.0668, "lr": 0.01317339849991142, "epoch": 1.691813451249603, "percentage": 86.56, "elapsed_time": "1 day, 12:42:24", "remaining_time": "5:41:53", "throughput": 331.76, "total_tokens": 43840032} {"current_steps": 34630, "total_steps": 40000, "loss": 0.0699, "lr": 0.013149270093001675, "epoch": 1.6920577529132972, "percentage": 86.58, "elapsed_time": "1 day, 12:42:27", "remaining_time": "5:41:31", "throughput": 331.8, "total_tokens": 43846080} {"current_steps": 34635, "total_steps": 40000, "loss": 0.0483, "lr": 0.013125162790194227, "epoch": 1.6923020545769916, "percentage": 86.59, "elapsed_time": "1 day, 12:42:30", "remaining_time": "5:41:10", "throughput": 331.84, "total_tokens": 43852640} {"current_steps": 34640, "total_steps": 40000, "loss": 0.052, "lr": 0.01310107659520674, "epoch": 1.692546356240686, "percentage": 86.6, "elapsed_time": "1 day, 12:42:33", "remaining_time": "5:40:48", "throughput": 331.88, "total_tokens": 43858976} {"current_steps": 34645, "total_steps": 40000, "loss": 0.0513, "lr": 0.013077011511753655, "epoch": 1.6927906579043803, "percentage": 86.61, "elapsed_time": "1 day, 12:42:36", "remaining_time": "5:40:27", "throughput": 331.92, "total_tokens": 43865440} {"current_steps": 34650, "total_steps": 40000, "loss": 0.0662, "lr": 0.013052967543546056, "epoch": 1.6930349595680747, "percentage": 86.62, "elapsed_time": "1 day, 12:42:39", "remaining_time": "5:40:05", "throughput": 331.96, "total_tokens": 43871200} {"current_steps": 34655, "total_steps": 40000, "loss": 0.0418, "lr": 0.01302894469429186, "epoch": 1.693279261231769, "percentage": 86.64, "elapsed_time": "1 day, 12:42:42", "remaining_time": "5:39:44", "throughput": 332.0, "total_tokens": 43877600} {"current_steps": 34660, "total_steps": 40000, "loss": 0.0436, "lr": 0.013004942967695653, "epoch": 1.6935235628954635, "percentage": 86.65, "elapsed_time": "1 day, 12:42:46", "remaining_time": "5:39:22", "throughput": 332.04, "total_tokens": 43884256} {"current_steps": 34665, "total_steps": 40000, "loss": 0.1021, "lr": 0.012980962367458859, "epoch": 1.6937678645591576, "percentage": 86.66, "elapsed_time": "1 day, 12:42:49", "remaining_time": "5:39:01", "throughput": 332.08, "total_tokens": 43890368} {"current_steps": 34670, "total_steps": 40000, "loss": 0.0593, "lr": 0.012957002897279567, "epoch": 1.694012166222852, "percentage": 86.67, "elapsed_time": "1 day, 12:42:52", "remaining_time": "5:38:39", "throughput": 332.11, "total_tokens": 43895968} {"current_steps": 34675, "total_steps": 40000, "loss": 0.0569, "lr": 0.012933064560852576, "epoch": 1.6942564678865462, "percentage": 86.69, "elapsed_time": "1 day, 12:42:55", "remaining_time": "5:38:17", "throughput": 332.15, "total_tokens": 43902080} {"current_steps": 34680, "total_steps": 40000, "loss": 0.0694, "lr": 0.012909147361869527, "epoch": 1.6945007695502405, "percentage": 86.7, "elapsed_time": "1 day, 12:42:58", "remaining_time": "5:37:56", "throughput": 332.19, "total_tokens": 43907936} {"current_steps": 34685, "total_steps": 40000, "loss": 0.0338, "lr": 0.012885251304018774, "epoch": 1.694745071213935, "percentage": 86.71, "elapsed_time": "1 day, 12:43:01", "remaining_time": "5:37:34", "throughput": 332.23, "total_tokens": 43914528} {"current_steps": 34690, "total_steps": 40000, "loss": 0.0519, "lr": 0.012861376390985335, "epoch": 1.6949893728776293, "percentage": 86.72, "elapsed_time": "1 day, 12:43:04", "remaining_time": "5:37:13", "throughput": 332.27, "total_tokens": 43920992} {"current_steps": 34695, "total_steps": 40000, "loss": 0.0378, "lr": 0.012837522626451063, "epoch": 1.6952336745413237, "percentage": 86.74, "elapsed_time": "1 day, 12:43:07", "remaining_time": "5:36:51", "throughput": 332.31, "total_tokens": 43927328} {"current_steps": 34700, "total_steps": 40000, "loss": 0.0683, "lr": 0.01281369001409447, "epoch": 1.695477976205018, "percentage": 86.75, "elapsed_time": "1 day, 12:43:10", "remaining_time": "5:36:30", "throughput": 332.35, "total_tokens": 43933600} {"current_steps": 34705, "total_steps": 40000, "loss": 0.0524, "lr": 0.012789878557590877, "epoch": 1.6957222778687124, "percentage": 86.76, "elapsed_time": "1 day, 12:43:13", "remaining_time": "5:36:08", "throughput": 332.39, "total_tokens": 43939776} {"current_steps": 34710, "total_steps": 40000, "loss": 0.059, "lr": 0.012766088260612334, "epoch": 1.6959665795324066, "percentage": 86.78, "elapsed_time": "1 day, 12:43:16", "remaining_time": "5:35:47", "throughput": 332.43, "total_tokens": 43946240} {"current_steps": 34715, "total_steps": 40000, "loss": 0.0515, "lr": 0.012742319126827523, "epoch": 1.696210881196101, "percentage": 86.79, "elapsed_time": "1 day, 12:43:19", "remaining_time": "5:35:25", "throughput": 332.47, "total_tokens": 43952224} {"current_steps": 34720, "total_steps": 40000, "loss": 0.0614, "lr": 0.012718571159902008, "epoch": 1.6964551828597951, "percentage": 86.8, "elapsed_time": "1 day, 12:43:22", "remaining_time": "5:35:04", "throughput": 332.51, "total_tokens": 43958752} {"current_steps": 34725, "total_steps": 40000, "loss": 0.0645, "lr": 0.01269484436349803, "epoch": 1.6966994845234895, "percentage": 86.81, "elapsed_time": "1 day, 12:43:25", "remaining_time": "5:34:43", "throughput": 332.55, "total_tokens": 43965152} {"current_steps": 34730, "total_steps": 40000, "loss": 0.0373, "lr": 0.012671138741274528, "epoch": 1.696943786187184, "percentage": 86.83, "elapsed_time": "1 day, 12:43:28", "remaining_time": "5:34:21", "throughput": 332.59, "total_tokens": 43971680} {"current_steps": 34735, "total_steps": 40000, "loss": 0.0466, "lr": 0.012647454296887194, "epoch": 1.6971880878508783, "percentage": 86.84, "elapsed_time": "1 day, 12:43:31", "remaining_time": "5:34:00", "throughput": 332.64, "total_tokens": 43978432} {"current_steps": 34740, "total_steps": 40000, "loss": 0.052, "lr": 0.012623791033988507, "epoch": 1.6974323895145726, "percentage": 86.85, "elapsed_time": "1 day, 12:43:34", "remaining_time": "5:33:38", "throughput": 332.68, "total_tokens": 43984768} {"current_steps": 34745, "total_steps": 40000, "loss": 0.0671, "lr": 0.012600148956227597, "epoch": 1.697676691178267, "percentage": 86.86, "elapsed_time": "1 day, 12:43:37", "remaining_time": "5:33:17", "throughput": 332.72, "total_tokens": 43990912} {"current_steps": 34750, "total_steps": 40000, "loss": 0.05, "lr": 0.012576528067250414, "epoch": 1.6979209928419614, "percentage": 86.88, "elapsed_time": "1 day, 12:43:40", "remaining_time": "5:32:55", "throughput": 332.75, "total_tokens": 43996768} {"current_steps": 34755, "total_steps": 40000, "loss": 0.065, "lr": 0.012552928370699561, "epoch": 1.6981652945056556, "percentage": 86.89, "elapsed_time": "1 day, 12:43:43", "remaining_time": "5:32:34", "throughput": 332.79, "total_tokens": 44002880} {"current_steps": 34760, "total_steps": 40000, "loss": 0.055, "lr": 0.012529349870214411, "epoch": 1.69840959616935, "percentage": 86.9, "elapsed_time": "1 day, 12:43:47", "remaining_time": "5:32:12", "throughput": 332.83, "total_tokens": 44009440} {"current_steps": 34765, "total_steps": 40000, "loss": 0.0595, "lr": 0.012505792569431106, "epoch": 1.698653897833044, "percentage": 86.91, "elapsed_time": "1 day, 12:43:50", "remaining_time": "5:31:51", "throughput": 332.87, "total_tokens": 44015808} {"current_steps": 34770, "total_steps": 40000, "loss": 0.05, "lr": 0.012482256471982422, "epoch": 1.6988981994967385, "percentage": 86.92, "elapsed_time": "1 day, 12:43:53", "remaining_time": "5:31:30", "throughput": 332.91, "total_tokens": 44022080} {"current_steps": 34775, "total_steps": 40000, "loss": 0.0418, "lr": 0.012458741581497956, "epoch": 1.6991425011604329, "percentage": 86.94, "elapsed_time": "1 day, 12:43:56", "remaining_time": "5:31:08", "throughput": 332.95, "total_tokens": 44028128} {"current_steps": 34780, "total_steps": 40000, "loss": 0.0376, "lr": 0.012435247901603974, "epoch": 1.6993868028241272, "percentage": 86.95, "elapsed_time": "1 day, 12:43:59", "remaining_time": "5:30:47", "throughput": 332.99, "total_tokens": 44034528} {"current_steps": 34785, "total_steps": 40000, "loss": 0.0525, "lr": 0.012411775435923528, "epoch": 1.6996311044878216, "percentage": 86.96, "elapsed_time": "1 day, 12:44:02", "remaining_time": "5:30:25", "throughput": 333.03, "total_tokens": 44040896} {"current_steps": 34790, "total_steps": 40000, "loss": 0.0689, "lr": 0.012388324188076354, "epoch": 1.699875406151516, "percentage": 86.98, "elapsed_time": "1 day, 12:44:05", "remaining_time": "5:30:04", "throughput": 333.07, "total_tokens": 44046816} {"current_steps": 34795, "total_steps": 40000, "loss": 0.0723, "lr": 0.012364894161678913, "epoch": 1.7001197078152104, "percentage": 86.99, "elapsed_time": "1 day, 12:44:08", "remaining_time": "5:29:43", "throughput": 333.11, "total_tokens": 44053056} {"current_steps": 34800, "total_steps": 40000, "loss": 0.0307, "lr": 0.012341485360344445, "epoch": 1.7003640094789045, "percentage": 87.0, "elapsed_time": "1 day, 12:44:11", "remaining_time": "5:29:21", "throughput": 333.15, "total_tokens": 44059712} {"current_steps": 34800, "total_steps": 40000, "eval_loss": 0.060834601521492004, "epoch": 1.7003640094789045, "percentage": 87.0, "elapsed_time": "1 day, 12:54:45", "remaining_time": "5:30:56", "throughput": 331.56, "total_tokens": 44059712} {"current_steps": 34805, "total_steps": 40000, "loss": 0.0523, "lr": 0.01231809778768283, "epoch": 1.700608311142599, "percentage": 87.01, "elapsed_time": "1 day, 12:54:49", "remaining_time": "5:30:35", "throughput": 331.6, "total_tokens": 44066240} {"current_steps": 34810, "total_steps": 40000, "loss": 0.0769, "lr": 0.012294731447300799, "epoch": 1.700852612806293, "percentage": 87.02, "elapsed_time": "1 day, 12:54:52", "remaining_time": "5:30:13", "throughput": 331.64, "total_tokens": 44072384} {"current_steps": 34815, "total_steps": 40000, "loss": 0.0707, "lr": 0.012271386342801671, "epoch": 1.7010969144699875, "percentage": 87.04, "elapsed_time": "1 day, 12:54:55", "remaining_time": "5:29:52", "throughput": 331.68, "total_tokens": 44078656} {"current_steps": 34820, "total_steps": 40000, "loss": 0.0791, "lr": 0.012248062477785565, "epoch": 1.7013412161336818, "percentage": 87.05, "elapsed_time": "1 day, 12:54:58", "remaining_time": "5:29:30", "throughput": 331.72, "total_tokens": 44084704} {"current_steps": 34825, "total_steps": 40000, "loss": 0.0665, "lr": 0.012224759855849305, "epoch": 1.7015855177973762, "percentage": 87.06, "elapsed_time": "1 day, 12:55:01", "remaining_time": "5:29:09", "throughput": 331.76, "total_tokens": 44090848} {"current_steps": 34830, "total_steps": 40000, "loss": 0.0516, "lr": 0.012201478480586513, "epoch": 1.7018298194610706, "percentage": 87.08, "elapsed_time": "1 day, 12:55:04", "remaining_time": "5:28:47", "throughput": 331.8, "total_tokens": 44096960} {"current_steps": 34835, "total_steps": 40000, "loss": 0.0458, "lr": 0.012178218355587389, "epoch": 1.702074121124765, "percentage": 87.09, "elapsed_time": "1 day, 12:55:07", "remaining_time": "5:28:26", "throughput": 331.84, "total_tokens": 44103840} {"current_steps": 34840, "total_steps": 40000, "loss": 0.0478, "lr": 0.01215497948443896, "epoch": 1.7023184227884594, "percentage": 87.1, "elapsed_time": "1 day, 12:55:10", "remaining_time": "5:28:04", "throughput": 331.88, "total_tokens": 44110016} {"current_steps": 34845, "total_steps": 40000, "loss": 0.0712, "lr": 0.012131761870724993, "epoch": 1.7025627244521535, "percentage": 87.11, "elapsed_time": "1 day, 12:55:13", "remaining_time": "5:27:43", "throughput": 331.92, "total_tokens": 44116928} {"current_steps": 34850, "total_steps": 40000, "loss": 0.0636, "lr": 0.012108565518025893, "epoch": 1.7028070261158479, "percentage": 87.12, "elapsed_time": "1 day, 12:55:16", "remaining_time": "5:27:21", "throughput": 331.96, "total_tokens": 44123680} {"current_steps": 34855, "total_steps": 40000, "loss": 0.0655, "lr": 0.012085390429918862, "epoch": 1.703051327779542, "percentage": 87.14, "elapsed_time": "1 day, 12:55:19", "remaining_time": "5:27:00", "throughput": 332.01, "total_tokens": 44130112} {"current_steps": 34860, "total_steps": 40000, "loss": 0.062, "lr": 0.012062236609977744, "epoch": 1.7032956294432364, "percentage": 87.15, "elapsed_time": "1 day, 12:55:23", "remaining_time": "5:26:39", "throughput": 332.05, "total_tokens": 44136768} {"current_steps": 34865, "total_steps": 40000, "loss": 0.0521, "lr": 0.01203910406177318, "epoch": 1.7035399311069308, "percentage": 87.16, "elapsed_time": "1 day, 12:55:26", "remaining_time": "5:26:17", "throughput": 332.09, "total_tokens": 44143136} {"current_steps": 34870, "total_steps": 40000, "loss": 0.0312, "lr": 0.01201599278887252, "epoch": 1.7037842327706252, "percentage": 87.17, "elapsed_time": "1 day, 12:55:29", "remaining_time": "5:25:56", "throughput": 332.13, "total_tokens": 44149312} {"current_steps": 34875, "total_steps": 40000, "loss": 0.0417, "lr": 0.011992902794839744, "epoch": 1.7040285344343196, "percentage": 87.19, "elapsed_time": "1 day, 12:55:32", "remaining_time": "5:25:34", "throughput": 332.17, "total_tokens": 44155648} {"current_steps": 34880, "total_steps": 40000, "loss": 0.0671, "lr": 0.011969834083235703, "epoch": 1.704272836098014, "percentage": 87.2, "elapsed_time": "1 day, 12:55:35", "remaining_time": "5:25:13", "throughput": 332.21, "total_tokens": 44162016} {"current_steps": 34885, "total_steps": 40000, "loss": 0.0567, "lr": 0.011946786657617836, "epoch": 1.7045171377617083, "percentage": 87.21, "elapsed_time": "1 day, 12:55:38", "remaining_time": "5:24:52", "throughput": 332.25, "total_tokens": 44168384} {"current_steps": 34890, "total_steps": 40000, "loss": 0.0512, "lr": 0.011923760521540332, "epoch": 1.7047614394254025, "percentage": 87.22, "elapsed_time": "1 day, 12:55:41", "remaining_time": "5:24:30", "throughput": 332.29, "total_tokens": 44174688} {"current_steps": 34895, "total_steps": 40000, "loss": 0.0687, "lr": 0.011900755678554153, "epoch": 1.7050057410890969, "percentage": 87.24, "elapsed_time": "1 day, 12:55:44", "remaining_time": "5:24:09", "throughput": 332.33, "total_tokens": 44180800} {"current_steps": 34900, "total_steps": 40000, "loss": 0.0593, "lr": 0.011877772132206893, "epoch": 1.705250042752791, "percentage": 87.25, "elapsed_time": "1 day, 12:55:47", "remaining_time": "5:23:47", "throughput": 332.37, "total_tokens": 44187424} {"current_steps": 34905, "total_steps": 40000, "loss": 0.0575, "lr": 0.011854809886042915, "epoch": 1.7054943444164854, "percentage": 87.26, "elapsed_time": "1 day, 12:55:50", "remaining_time": "5:23:26", "throughput": 332.4, "total_tokens": 44193440} {"current_steps": 34910, "total_steps": 40000, "loss": 0.038, "lr": 0.011831868943603325, "epoch": 1.7057386460801798, "percentage": 87.28, "elapsed_time": "1 day, 12:55:53", "remaining_time": "5:23:05", "throughput": 332.45, "total_tokens": 44199936} {"current_steps": 34915, "total_steps": 40000, "loss": 0.0531, "lr": 0.011808949308425836, "epoch": 1.7059829477438742, "percentage": 87.29, "elapsed_time": "1 day, 12:55:56", "remaining_time": "5:22:43", "throughput": 332.48, "total_tokens": 44205728} {"current_steps": 34920, "total_steps": 40000, "loss": 0.0687, "lr": 0.01178605098404501, "epoch": 1.7062272494075685, "percentage": 87.3, "elapsed_time": "1 day, 12:55:59", "remaining_time": "5:22:22", "throughput": 332.52, "total_tokens": 44212320} {"current_steps": 34925, "total_steps": 40000, "loss": 0.0261, "lr": 0.011763173973992002, "epoch": 1.706471551071263, "percentage": 87.31, "elapsed_time": "1 day, 12:56:02", "remaining_time": "5:22:01", "throughput": 332.57, "total_tokens": 44218976} {"current_steps": 34930, "total_steps": 40000, "loss": 0.0696, "lr": 0.011740318281794776, "epoch": 1.706715852734957, "percentage": 87.33, "elapsed_time": "1 day, 12:56:05", "remaining_time": "5:21:39", "throughput": 332.6, "total_tokens": 44224896} {"current_steps": 34935, "total_steps": 40000, "loss": 0.06, "lr": 0.01171748391097796, "epoch": 1.7069601543986515, "percentage": 87.34, "elapsed_time": "1 day, 12:56:09", "remaining_time": "5:21:18", "throughput": 332.64, "total_tokens": 44231232} {"current_steps": 34940, "total_steps": 40000, "loss": 0.0629, "lr": 0.011694670865062873, "epoch": 1.7072044560623458, "percentage": 87.35, "elapsed_time": "1 day, 12:56:12", "remaining_time": "5:20:56", "throughput": 332.68, "total_tokens": 44237344} {"current_steps": 34945, "total_steps": 40000, "loss": 0.0382, "lr": 0.011671879147567616, "epoch": 1.70744875772604, "percentage": 87.36, "elapsed_time": "1 day, 12:56:15", "remaining_time": "5:20:35", "throughput": 332.72, "total_tokens": 44243680} {"current_steps": 34950, "total_steps": 40000, "loss": 0.0499, "lr": 0.011649108762006893, "epoch": 1.7076930593897344, "percentage": 87.38, "elapsed_time": "1 day, 12:56:18", "remaining_time": "5:20:14", "throughput": 332.76, "total_tokens": 44249792} {"current_steps": 34955, "total_steps": 40000, "loss": 0.0843, "lr": 0.011626359711892265, "epoch": 1.7079373610534287, "percentage": 87.39, "elapsed_time": "1 day, 12:56:21", "remaining_time": "5:19:52", "throughput": 332.8, "total_tokens": 44256064} {"current_steps": 34960, "total_steps": 40000, "loss": 0.0712, "lr": 0.01160363200073189, "epoch": 1.7081816627171231, "percentage": 87.4, "elapsed_time": "1 day, 12:56:24", "remaining_time": "5:19:31", "throughput": 332.84, "total_tokens": 44262368} {"current_steps": 34965, "total_steps": 40000, "loss": 0.0632, "lr": 0.011580925632030614, "epoch": 1.7084259643808175, "percentage": 87.41, "elapsed_time": "1 day, 12:56:27", "remaining_time": "5:19:10", "throughput": 332.88, "total_tokens": 44268416} {"current_steps": 34970, "total_steps": 40000, "loss": 0.0391, "lr": 0.011558240609290104, "epoch": 1.7086702660445119, "percentage": 87.42, "elapsed_time": "1 day, 12:56:30", "remaining_time": "5:18:48", "throughput": 332.92, "total_tokens": 44274624} {"current_steps": 34975, "total_steps": 40000, "loss": 0.0709, "lr": 0.011535576936008679, "epoch": 1.708914567708206, "percentage": 87.44, "elapsed_time": "1 day, 12:56:33", "remaining_time": "5:18:27", "throughput": 332.96, "total_tokens": 44281184} {"current_steps": 34980, "total_steps": 40000, "loss": 0.0581, "lr": 0.011512934615681309, "epoch": 1.7091588693719004, "percentage": 87.45, "elapsed_time": "1 day, 12:56:36", "remaining_time": "5:18:06", "throughput": 333.0, "total_tokens": 44287424} {"current_steps": 34985, "total_steps": 40000, "loss": 0.0527, "lr": 0.011490313651799765, "epoch": 1.7094031710355948, "percentage": 87.46, "elapsed_time": "1 day, 12:56:39", "remaining_time": "5:17:45", "throughput": 333.04, "total_tokens": 44293920} {"current_steps": 34990, "total_steps": 40000, "loss": 0.0604, "lr": 0.011467714047852512, "epoch": 1.709647472699289, "percentage": 87.48, "elapsed_time": "1 day, 12:56:42", "remaining_time": "5:17:23", "throughput": 333.08, "total_tokens": 44300096} {"current_steps": 34995, "total_steps": 40000, "loss": 0.0389, "lr": 0.011445135807324624, "epoch": 1.7098917743629833, "percentage": 87.49, "elapsed_time": "1 day, 12:56:45", "remaining_time": "5:17:02", "throughput": 333.12, "total_tokens": 44306656} {"current_steps": 35000, "total_steps": 40000, "loss": 0.0393, "lr": 0.011422578933698002, "epoch": 1.7101360760266777, "percentage": 87.5, "elapsed_time": "1 day, 12:56:48", "remaining_time": "5:16:41", "throughput": 333.16, "total_tokens": 44313216} {"current_steps": 35000, "total_steps": 40000, "eval_loss": 0.060744963586330414, "epoch": 1.7101360760266777, "percentage": 87.5, "elapsed_time": "1 day, 13:07:23", "remaining_time": "5:18:11", "throughput": 331.58, "total_tokens": 44313216} {"current_steps": 35005, "total_steps": 40000, "loss": 0.0654, "lr": 0.011400043430451161, "epoch": 1.710380377690372, "percentage": 87.51, "elapsed_time": "1 day, 13:07:27", "remaining_time": "5:17:50", "throughput": 331.61, "total_tokens": 44319232} {"current_steps": 35010, "total_steps": 40000, "loss": 0.0495, "lr": 0.011377529301059392, "epoch": 1.7106246793540665, "percentage": 87.52, "elapsed_time": "1 day, 13:07:30", "remaining_time": "5:17:29", "throughput": 331.65, "total_tokens": 44325600} {"current_steps": 35015, "total_steps": 40000, "loss": 0.0742, "lr": 0.011355036548994646, "epoch": 1.7108689810177609, "percentage": 87.54, "elapsed_time": "1 day, 13:07:33", "remaining_time": "5:17:07", "throughput": 331.69, "total_tokens": 44331840} {"current_steps": 35020, "total_steps": 40000, "loss": 0.0546, "lr": 0.011332565177725584, "epoch": 1.711113282681455, "percentage": 87.55, "elapsed_time": "1 day, 13:07:36", "remaining_time": "5:16:46", "throughput": 331.73, "total_tokens": 44338048} {"current_steps": 35025, "total_steps": 40000, "loss": 0.0732, "lr": 0.011310115190717585, "epoch": 1.7113575843451494, "percentage": 87.56, "elapsed_time": "1 day, 13:07:39", "remaining_time": "5:16:25", "throughput": 331.77, "total_tokens": 44344608} {"current_steps": 35030, "total_steps": 40000, "loss": 0.0382, "lr": 0.01128768659143271, "epoch": 1.7116018860088436, "percentage": 87.58, "elapsed_time": "1 day, 13:07:42", "remaining_time": "5:16:03", "throughput": 331.81, "total_tokens": 44350880} {"current_steps": 35035, "total_steps": 40000, "loss": 0.053, "lr": 0.011265279383329713, "epoch": 1.711846187672538, "percentage": 87.59, "elapsed_time": "1 day, 13:07:45", "remaining_time": "5:15:42", "throughput": 331.85, "total_tokens": 44357088} {"current_steps": 35040, "total_steps": 40000, "loss": 0.0418, "lr": 0.01124289356986411, "epoch": 1.7120904893362323, "percentage": 87.6, "elapsed_time": "1 day, 13:07:48", "remaining_time": "5:15:21", "throughput": 331.9, "total_tokens": 44364064} {"current_steps": 35045, "total_steps": 40000, "loss": 0.0488, "lr": 0.011220529154488023, "epoch": 1.7123347909999267, "percentage": 87.61, "elapsed_time": "1 day, 13:07:51", "remaining_time": "5:14:59", "throughput": 331.93, "total_tokens": 44370176} {"current_steps": 35050, "total_steps": 40000, "loss": 0.0649, "lr": 0.011198186140650346, "epoch": 1.712579092663621, "percentage": 87.62, "elapsed_time": "1 day, 13:07:54", "remaining_time": "5:14:38", "throughput": 331.97, "total_tokens": 44376576} {"current_steps": 35055, "total_steps": 40000, "loss": 0.0566, "lr": 0.011175864531796685, "epoch": 1.7128233943273155, "percentage": 87.64, "elapsed_time": "1 day, 13:07:58", "remaining_time": "5:14:17", "throughput": 332.02, "total_tokens": 44383456} {"current_steps": 35060, "total_steps": 40000, "loss": 0.0509, "lr": 0.011153564331369258, "epoch": 1.7130676959910098, "percentage": 87.65, "elapsed_time": "1 day, 13:08:01", "remaining_time": "5:13:55", "throughput": 332.06, "total_tokens": 44390080} {"current_steps": 35065, "total_steps": 40000, "loss": 0.0746, "lr": 0.011131285542807078, "epoch": 1.713311997654704, "percentage": 87.66, "elapsed_time": "1 day, 13:08:04", "remaining_time": "5:13:34", "throughput": 332.1, "total_tokens": 44396544} {"current_steps": 35070, "total_steps": 40000, "loss": 0.0524, "lr": 0.011109028169545815, "epoch": 1.7135562993183984, "percentage": 87.67, "elapsed_time": "1 day, 13:08:07", "remaining_time": "5:13:13", "throughput": 332.14, "total_tokens": 44403424} {"current_steps": 35075, "total_steps": 40000, "loss": 0.056, "lr": 0.011086792215017804, "epoch": 1.7138006009820925, "percentage": 87.69, "elapsed_time": "1 day, 13:08:10", "remaining_time": "5:12:51", "throughput": 332.19, "total_tokens": 44410080} {"current_steps": 35080, "total_steps": 40000, "loss": 0.0573, "lr": 0.011064577682652137, "epoch": 1.714044902645787, "percentage": 87.7, "elapsed_time": "1 day, 13:08:13", "remaining_time": "5:12:30", "throughput": 332.22, "total_tokens": 44416192} {"current_steps": 35085, "total_steps": 40000, "loss": 0.0804, "lr": 0.011042384575874559, "epoch": 1.7142892043094813, "percentage": 87.71, "elapsed_time": "1 day, 13:08:16", "remaining_time": "5:12:09", "throughput": 332.26, "total_tokens": 44422208} {"current_steps": 35090, "total_steps": 40000, "loss": 0.0461, "lr": 0.011020212898107512, "epoch": 1.7145335059731757, "percentage": 87.72, "elapsed_time": "1 day, 13:08:19", "remaining_time": "5:11:48", "throughput": 332.3, "total_tokens": 44428736} {"current_steps": 35095, "total_steps": 40000, "loss": 0.0644, "lr": 0.010998062652770197, "epoch": 1.71477780763687, "percentage": 87.74, "elapsed_time": "1 day, 13:08:22", "remaining_time": "5:11:26", "throughput": 332.34, "total_tokens": 44434816} {"current_steps": 35100, "total_steps": 40000, "loss": 0.037, "lr": 0.010975933843278428, "epoch": 1.7150221093005644, "percentage": 87.75, "elapsed_time": "1 day, 13:08:25", "remaining_time": "5:11:05", "throughput": 332.38, "total_tokens": 44440864} {"current_steps": 35105, "total_steps": 40000, "loss": 0.0751, "lr": 0.010953826473044714, "epoch": 1.7152664109642588, "percentage": 87.76, "elapsed_time": "1 day, 13:08:28", "remaining_time": "5:10:44", "throughput": 332.42, "total_tokens": 44447168} {"current_steps": 35110, "total_steps": 40000, "loss": 0.057, "lr": 0.010931740545478357, "epoch": 1.715510712627953, "percentage": 87.78, "elapsed_time": "1 day, 13:08:31", "remaining_time": "5:10:22", "throughput": 332.46, "total_tokens": 44453248} {"current_steps": 35115, "total_steps": 40000, "loss": 0.0399, "lr": 0.010909676063985218, "epoch": 1.7157550142916473, "percentage": 87.79, "elapsed_time": "1 day, 13:08:34", "remaining_time": "5:10:01", "throughput": 332.5, "total_tokens": 44459616} {"current_steps": 35120, "total_steps": 40000, "loss": 0.0296, "lr": 0.010887633031967974, "epoch": 1.7159993159553415, "percentage": 87.8, "elapsed_time": "1 day, 13:08:37", "remaining_time": "5:09:40", "throughput": 332.54, "total_tokens": 44466016} {"current_steps": 35125, "total_steps": 40000, "loss": 0.0465, "lr": 0.01086561145282589, "epoch": 1.7162436176190359, "percentage": 87.81, "elapsed_time": "1 day, 13:08:41", "remaining_time": "5:09:19", "throughput": 332.58, "total_tokens": 44472608} {"current_steps": 35130, "total_steps": 40000, "loss": 0.0287, "lr": 0.010843611329954983, "epoch": 1.7164879192827303, "percentage": 87.83, "elapsed_time": "1 day, 13:08:44", "remaining_time": "5:08:57", "throughput": 332.62, "total_tokens": 44479104} {"current_steps": 35135, "total_steps": 40000, "loss": 0.0803, "lr": 0.010821632666747988, "epoch": 1.7167322209464246, "percentage": 87.84, "elapsed_time": "1 day, 13:08:47", "remaining_time": "5:08:36", "throughput": 332.66, "total_tokens": 44485408} {"current_steps": 35140, "total_steps": 40000, "loss": 0.044, "lr": 0.010799675466594244, "epoch": 1.716976522610119, "percentage": 87.85, "elapsed_time": "1 day, 13:08:50", "remaining_time": "5:08:15", "throughput": 332.7, "total_tokens": 44491712} {"current_steps": 35145, "total_steps": 40000, "loss": 0.0338, "lr": 0.010777739732879826, "epoch": 1.7172208242738134, "percentage": 87.86, "elapsed_time": "1 day, 13:08:53", "remaining_time": "5:07:54", "throughput": 332.74, "total_tokens": 44498112} {"current_steps": 35150, "total_steps": 40000, "loss": 0.0419, "lr": 0.010755825468987562, "epoch": 1.7174651259375078, "percentage": 87.88, "elapsed_time": "1 day, 13:08:56", "remaining_time": "5:07:32", "throughput": 332.77, "total_tokens": 44503872} {"current_steps": 35155, "total_steps": 40000, "loss": 0.0785, "lr": 0.010733932678296814, "epoch": 1.717709427601202, "percentage": 87.89, "elapsed_time": "1 day, 13:08:59", "remaining_time": "5:07:11", "throughput": 332.81, "total_tokens": 44510112} {"current_steps": 35160, "total_steps": 40000, "loss": 0.0822, "lr": 0.010712061364183817, "epoch": 1.7179537292648963, "percentage": 87.9, "elapsed_time": "1 day, 13:09:02", "remaining_time": "5:06:50", "throughput": 332.85, "total_tokens": 44516032} {"current_steps": 35165, "total_steps": 40000, "loss": 0.0461, "lr": 0.010690211530021337, "epoch": 1.7181980309285905, "percentage": 87.91, "elapsed_time": "1 day, 13:09:05", "remaining_time": "5:06:29", "throughput": 332.89, "total_tokens": 44522208} {"current_steps": 35170, "total_steps": 40000, "loss": 0.0671, "lr": 0.01066838317917893, "epoch": 1.7184423325922848, "percentage": 87.92, "elapsed_time": "1 day, 13:09:08", "remaining_time": "5:06:08", "throughput": 332.93, "total_tokens": 44528384} {"current_steps": 35175, "total_steps": 40000, "loss": 0.0582, "lr": 0.010646576315022787, "epoch": 1.7186866342559792, "percentage": 87.94, "elapsed_time": "1 day, 13:09:11", "remaining_time": "5:05:46", "throughput": 332.97, "total_tokens": 44534784} {"current_steps": 35180, "total_steps": 40000, "loss": 0.0648, "lr": 0.010624790940915785, "epoch": 1.7189309359196736, "percentage": 87.95, "elapsed_time": "1 day, 13:09:14", "remaining_time": "5:05:25", "throughput": 333.01, "total_tokens": 44540992} {"current_steps": 35185, "total_steps": 40000, "loss": 0.081, "lr": 0.0106030270602175, "epoch": 1.719175237583368, "percentage": 87.96, "elapsed_time": "1 day, 13:09:17", "remaining_time": "5:05:04", "throughput": 333.05, "total_tokens": 44547296} {"current_steps": 35190, "total_steps": 40000, "loss": 0.0422, "lr": 0.010581284676284252, "epoch": 1.7194195392470624, "percentage": 87.98, "elapsed_time": "1 day, 13:09:20", "remaining_time": "5:04:43", "throughput": 333.09, "total_tokens": 44553856} {"current_steps": 35195, "total_steps": 40000, "loss": 0.0337, "lr": 0.010559563792468923, "epoch": 1.7196638409107567, "percentage": 87.99, "elapsed_time": "1 day, 13:09:23", "remaining_time": "5:04:22", "throughput": 333.13, "total_tokens": 44560128} {"current_steps": 35200, "total_steps": 40000, "loss": 0.0427, "lr": 0.010537864412121217, "epoch": 1.719908142574451, "percentage": 88.0, "elapsed_time": "1 day, 13:09:26", "remaining_time": "5:04:00", "throughput": 333.16, "total_tokens": 44566336} {"current_steps": 35200, "total_steps": 40000, "eval_loss": 0.06109674274921417, "epoch": 1.719908142574451, "percentage": 88.0, "elapsed_time": "1 day, 13:20:01", "remaining_time": "5:05:27", "throughput": 331.59, "total_tokens": 44566336} {"current_steps": 35205, "total_steps": 40000, "loss": 0.0473, "lr": 0.010516186538587357, "epoch": 1.7201524442381453, "percentage": 88.01, "elapsed_time": "1 day, 13:20:05", "remaining_time": "5:05:06", "throughput": 331.63, "total_tokens": 44572416} {"current_steps": 35210, "total_steps": 40000, "loss": 0.05, "lr": 0.01049453017521042, "epoch": 1.7203967459018394, "percentage": 88.02, "elapsed_time": "1 day, 13:20:08", "remaining_time": "5:04:45", "throughput": 331.66, "total_tokens": 44578368} {"current_steps": 35215, "total_steps": 40000, "loss": 0.0638, "lr": 0.010472895325330083, "epoch": 1.7206410475655338, "percentage": 88.04, "elapsed_time": "1 day, 13:20:11", "remaining_time": "5:04:23", "throughput": 331.71, "total_tokens": 44585184} {"current_steps": 35220, "total_steps": 40000, "loss": 0.0581, "lr": 0.010451281992282662, "epoch": 1.7208853492292282, "percentage": 88.05, "elapsed_time": "1 day, 13:20:14", "remaining_time": "5:04:02", "throughput": 331.75, "total_tokens": 44591520} {"current_steps": 35225, "total_steps": 40000, "loss": 0.0501, "lr": 0.01042969017940124, "epoch": 1.7211296508929226, "percentage": 88.06, "elapsed_time": "1 day, 13:20:17", "remaining_time": "5:03:41", "throughput": 331.78, "total_tokens": 44597472} {"current_steps": 35230, "total_steps": 40000, "loss": 0.0512, "lr": 0.01040811989001557, "epoch": 1.721373952556617, "percentage": 88.08, "elapsed_time": "1 day, 13:20:20", "remaining_time": "5:03:20", "throughput": 331.82, "total_tokens": 44603808} {"current_steps": 35235, "total_steps": 40000, "loss": 0.0334, "lr": 0.010386571127451992, "epoch": 1.7216182542203113, "percentage": 88.09, "elapsed_time": "1 day, 13:20:23", "remaining_time": "5:02:58", "throughput": 331.86, "total_tokens": 44609760} {"current_steps": 35240, "total_steps": 40000, "loss": 0.0433, "lr": 0.010365043895033682, "epoch": 1.7218625558840057, "percentage": 88.1, "elapsed_time": "1 day, 13:20:26", "remaining_time": "5:02:37", "throughput": 331.9, "total_tokens": 44615968} {"current_steps": 35245, "total_steps": 40000, "loss": 0.0502, "lr": 0.010343538196080365, "epoch": 1.7221068575476999, "percentage": 88.11, "elapsed_time": "1 day, 13:20:29", "remaining_time": "5:02:16", "throughput": 331.94, "total_tokens": 44622368} {"current_steps": 35250, "total_steps": 40000, "loss": 0.0304, "lr": 0.010322054033908457, "epoch": 1.7223511592113943, "percentage": 88.12, "elapsed_time": "1 day, 13:20:32", "remaining_time": "5:01:55", "throughput": 331.98, "total_tokens": 44628512} {"current_steps": 35255, "total_steps": 40000, "loss": 0.0798, "lr": 0.010300591411831156, "epoch": 1.7225954608750884, "percentage": 88.14, "elapsed_time": "1 day, 13:20:35", "remaining_time": "5:01:33", "throughput": 332.02, "total_tokens": 44634944} {"current_steps": 35260, "total_steps": 40000, "loss": 0.0646, "lr": 0.010279150333158198, "epoch": 1.7228397625387828, "percentage": 88.15, "elapsed_time": "1 day, 13:20:39", "remaining_time": "5:01:12", "throughput": 332.05, "total_tokens": 44641088} {"current_steps": 35265, "total_steps": 40000, "loss": 0.0542, "lr": 0.010257730801196107, "epoch": 1.7230840642024772, "percentage": 88.16, "elapsed_time": "1 day, 13:20:42", "remaining_time": "5:00:51", "throughput": 332.1, "total_tokens": 44648192} {"current_steps": 35270, "total_steps": 40000, "loss": 0.0367, "lr": 0.010236332819248056, "epoch": 1.7233283658661716, "percentage": 88.17, "elapsed_time": "1 day, 13:20:45", "remaining_time": "5:00:30", "throughput": 332.14, "total_tokens": 44654688} {"current_steps": 35275, "total_steps": 40000, "loss": 0.0677, "lr": 0.010214956390613854, "epoch": 1.723572667529866, "percentage": 88.19, "elapsed_time": "1 day, 13:20:48", "remaining_time": "5:00:09", "throughput": 332.18, "total_tokens": 44660800} {"current_steps": 35280, "total_steps": 40000, "loss": 0.0535, "lr": 0.010193601518590034, "epoch": 1.7238169691935603, "percentage": 88.2, "elapsed_time": "1 day, 13:20:51", "remaining_time": "4:59:47", "throughput": 332.21, "total_tokens": 44666752} {"current_steps": 35285, "total_steps": 40000, "loss": 0.0769, "lr": 0.010172268206469758, "epoch": 1.7240612708572547, "percentage": 88.21, "elapsed_time": "1 day, 13:20:54", "remaining_time": "4:59:26", "throughput": 332.25, "total_tokens": 44672704} {"current_steps": 35290, "total_steps": 40000, "loss": 0.0632, "lr": 0.010150956457542897, "epoch": 1.7243055725209488, "percentage": 88.22, "elapsed_time": "1 day, 13:20:57", "remaining_time": "4:59:05", "throughput": 332.29, "total_tokens": 44678688} {"current_steps": 35295, "total_steps": 40000, "loss": 0.058, "lr": 0.010129666275096054, "epoch": 1.7245498741846432, "percentage": 88.24, "elapsed_time": "1 day, 13:21:00", "remaining_time": "4:58:44", "throughput": 332.33, "total_tokens": 44684960} {"current_steps": 35300, "total_steps": 40000, "loss": 0.0716, "lr": 0.010108397662412338, "epoch": 1.7247941758483374, "percentage": 88.25, "elapsed_time": "1 day, 13:21:03", "remaining_time": "4:58:23", "throughput": 332.37, "total_tokens": 44691232} {"current_steps": 35305, "total_steps": 40000, "loss": 0.0841, "lr": 0.010087150622771707, "epoch": 1.7250384775120318, "percentage": 88.26, "elapsed_time": "1 day, 13:21:06", "remaining_time": "4:58:01", "throughput": 332.41, "total_tokens": 44697664} {"current_steps": 35310, "total_steps": 40000, "loss": 0.0386, "lr": 0.010065925159450739, "epoch": 1.7252827791757261, "percentage": 88.28, "elapsed_time": "1 day, 13:21:09", "remaining_time": "4:57:40", "throughput": 332.45, "total_tokens": 44703936} {"current_steps": 35315, "total_steps": 40000, "loss": 0.0506, "lr": 0.010044721275722618, "epoch": 1.7255270808394205, "percentage": 88.29, "elapsed_time": "1 day, 13:21:12", "remaining_time": "4:57:19", "throughput": 332.49, "total_tokens": 44710624} {"current_steps": 35320, "total_steps": 40000, "loss": 0.0541, "lr": 0.01002353897485726, "epoch": 1.725771382503115, "percentage": 88.3, "elapsed_time": "1 day, 13:21:15", "remaining_time": "4:56:58", "throughput": 332.53, "total_tokens": 44716864} {"current_steps": 35325, "total_steps": 40000, "loss": 0.0275, "lr": 0.010002378260121236, "epoch": 1.7260156841668093, "percentage": 88.31, "elapsed_time": "1 day, 13:21:18", "remaining_time": "4:56:37", "throughput": 332.57, "total_tokens": 44723200} {"current_steps": 35330, "total_steps": 40000, "loss": 0.0665, "lr": 0.009981239134777786, "epoch": 1.7262599858305037, "percentage": 88.33, "elapsed_time": "1 day, 13:21:22", "remaining_time": "4:56:16", "throughput": 332.61, "total_tokens": 44729760} {"current_steps": 35335, "total_steps": 40000, "loss": 0.0461, "lr": 0.009960121602086884, "epoch": 1.7265042874941978, "percentage": 88.34, "elapsed_time": "1 day, 13:21:25", "remaining_time": "4:55:54", "throughput": 332.65, "total_tokens": 44735808} {"current_steps": 35340, "total_steps": 40000, "loss": 0.0532, "lr": 0.009939025665305062, "epoch": 1.7267485891578922, "percentage": 88.35, "elapsed_time": "1 day, 13:21:28", "remaining_time": "4:55:33", "throughput": 332.69, "total_tokens": 44742240} {"current_steps": 35345, "total_steps": 40000, "loss": 0.0346, "lr": 0.009917951327685597, "epoch": 1.7269928908215864, "percentage": 88.36, "elapsed_time": "1 day, 13:21:31", "remaining_time": "4:55:12", "throughput": 332.72, "total_tokens": 44748128} {"current_steps": 35350, "total_steps": 40000, "loss": 0.0419, "lr": 0.009896898592478425, "epoch": 1.7272371924852807, "percentage": 88.38, "elapsed_time": "1 day, 13:21:34", "remaining_time": "4:54:51", "throughput": 332.76, "total_tokens": 44754976} {"current_steps": 35355, "total_steps": 40000, "loss": 0.0353, "lr": 0.009875867462930132, "epoch": 1.7274814941489751, "percentage": 88.39, "elapsed_time": "1 day, 13:21:37", "remaining_time": "4:54:30", "throughput": 332.8, "total_tokens": 44760960} {"current_steps": 35360, "total_steps": 40000, "loss": 0.0493, "lr": 0.009854857942284006, "epoch": 1.7277257958126695, "percentage": 88.4, "elapsed_time": "1 day, 13:21:40", "remaining_time": "4:54:09", "throughput": 332.84, "total_tokens": 44767296} {"current_steps": 35365, "total_steps": 40000, "loss": 0.0717, "lr": 0.009833870033779923, "epoch": 1.7279700974763639, "percentage": 88.41, "elapsed_time": "1 day, 13:21:43", "remaining_time": "4:53:48", "throughput": 332.88, "total_tokens": 44773664} {"current_steps": 35370, "total_steps": 40000, "loss": 0.0509, "lr": 0.009812903740654527, "epoch": 1.7282143991400583, "percentage": 88.42, "elapsed_time": "1 day, 13:21:46", "remaining_time": "4:53:27", "throughput": 332.92, "total_tokens": 44780000} {"current_steps": 35375, "total_steps": 40000, "loss": 0.1287, "lr": 0.009791959066141097, "epoch": 1.7284587008037526, "percentage": 88.44, "elapsed_time": "1 day, 13:21:49", "remaining_time": "4:53:06", "throughput": 332.96, "total_tokens": 44786144} {"current_steps": 35380, "total_steps": 40000, "loss": 0.0485, "lr": 0.009771036013469537, "epoch": 1.7287030024674468, "percentage": 88.45, "elapsed_time": "1 day, 13:21:52", "remaining_time": "4:52:44", "throughput": 333.0, "total_tokens": 44792480} {"current_steps": 35385, "total_steps": 40000, "loss": 0.0558, "lr": 0.00975013458586646, "epoch": 1.7289473041311412, "percentage": 88.46, "elapsed_time": "1 day, 13:21:55", "remaining_time": "4:52:23", "throughput": 333.04, "total_tokens": 44798784} {"current_steps": 35390, "total_steps": 40000, "loss": 0.1024, "lr": 0.009729254786555107, "epoch": 1.7291916057948353, "percentage": 88.48, "elapsed_time": "1 day, 13:21:58", "remaining_time": "4:52:02", "throughput": 333.08, "total_tokens": 44805216} {"current_steps": 35395, "total_steps": 40000, "loss": 0.0929, "lr": 0.009708396618755421, "epoch": 1.7294359074585297, "percentage": 88.49, "elapsed_time": "1 day, 13:22:01", "remaining_time": "4:51:41", "throughput": 333.12, "total_tokens": 44811552} {"current_steps": 35400, "total_steps": 40000, "loss": 0.0681, "lr": 0.009687560085683994, "epoch": 1.729680209122224, "percentage": 88.5, "elapsed_time": "1 day, 13:22:05", "remaining_time": "4:51:20", "throughput": 333.16, "total_tokens": 44817984} {"current_steps": 35400, "total_steps": 40000, "eval_loss": 0.06068366393446922, "epoch": 1.729680209122224, "percentage": 88.5, "elapsed_time": "1 day, 13:32:39", "remaining_time": "4:52:43", "throughput": 331.59, "total_tokens": 44817984} {"current_steps": 35405, "total_steps": 40000, "loss": 0.035, "lr": 0.009666745190554054, "epoch": 1.7299245107859185, "percentage": 88.51, "elapsed_time": "1 day, 13:32:43", "remaining_time": "4:52:22", "throughput": 331.63, "total_tokens": 44824480} {"current_steps": 35410, "total_steps": 40000, "loss": 0.0516, "lr": 0.009645951936575553, "epoch": 1.7301688124496128, "percentage": 88.52, "elapsed_time": "1 day, 13:32:46", "remaining_time": "4:52:00", "throughput": 331.67, "total_tokens": 44830752} {"current_steps": 35415, "total_steps": 40000, "loss": 0.0604, "lr": 0.00962518032695509, "epoch": 1.7304131141133072, "percentage": 88.54, "elapsed_time": "1 day, 13:32:49", "remaining_time": "4:51:39", "throughput": 331.71, "total_tokens": 44836928} {"current_steps": 35420, "total_steps": 40000, "loss": 0.063, "lr": 0.009604430364895855, "epoch": 1.7306574157770016, "percentage": 88.55, "elapsed_time": "1 day, 13:32:52", "remaining_time": "4:51:18", "throughput": 331.75, "total_tokens": 44843104} {"current_steps": 35425, "total_steps": 40000, "loss": 0.0555, "lr": 0.00958370205359777, "epoch": 1.7309017174406958, "percentage": 88.56, "elapsed_time": "1 day, 13:32:55", "remaining_time": "4:50:57", "throughput": 331.79, "total_tokens": 44849728} {"current_steps": 35430, "total_steps": 40000, "loss": 0.0411, "lr": 0.009562995396257445, "epoch": 1.7311460191043901, "percentage": 88.58, "elapsed_time": "1 day, 13:32:58", "remaining_time": "4:50:36", "throughput": 331.83, "total_tokens": 44856160} {"current_steps": 35435, "total_steps": 40000, "loss": 0.0423, "lr": 0.009542310396068026, "epoch": 1.7313903207680843, "percentage": 88.59, "elapsed_time": "1 day, 13:33:02", "remaining_time": "4:50:15", "throughput": 331.87, "total_tokens": 44862720} {"current_steps": 35440, "total_steps": 40000, "loss": 0.0453, "lr": 0.009521647056219495, "epoch": 1.7316346224317787, "percentage": 88.6, "elapsed_time": "1 day, 13:33:05", "remaining_time": "4:49:54", "throughput": 331.91, "total_tokens": 44868992} {"current_steps": 35445, "total_steps": 40000, "loss": 0.0479, "lr": 0.00950100537989832, "epoch": 1.731878924095473, "percentage": 88.61, "elapsed_time": "1 day, 13:33:08", "remaining_time": "4:49:32", "throughput": 331.95, "total_tokens": 44875552} {"current_steps": 35450, "total_steps": 40000, "loss": 0.0775, "lr": 0.00948038537028772, "epoch": 1.7321232257591674, "percentage": 88.62, "elapsed_time": "1 day, 13:33:11", "remaining_time": "4:49:11", "throughput": 331.99, "total_tokens": 44881600} {"current_steps": 35455, "total_steps": 40000, "loss": 0.0369, "lr": 0.009459787030567617, "epoch": 1.7323675274228618, "percentage": 88.64, "elapsed_time": "1 day, 13:33:14", "remaining_time": "4:48:50", "throughput": 332.03, "total_tokens": 44888224} {"current_steps": 35460, "total_steps": 40000, "loss": 0.056, "lr": 0.00943921036391449, "epoch": 1.7326118290865562, "percentage": 88.65, "elapsed_time": "1 day, 13:33:17", "remaining_time": "4:48:29", "throughput": 332.07, "total_tokens": 44894400} {"current_steps": 35465, "total_steps": 40000, "loss": 0.0732, "lr": 0.009418655373501483, "epoch": 1.7328561307502504, "percentage": 88.66, "elapsed_time": "1 day, 13:33:20", "remaining_time": "4:48:08", "throughput": 332.11, "total_tokens": 44900928} {"current_steps": 35470, "total_steps": 40000, "loss": 0.0987, "lr": 0.00939812206249851, "epoch": 1.7331004324139447, "percentage": 88.67, "elapsed_time": "1 day, 13:33:23", "remaining_time": "4:47:47", "throughput": 332.15, "total_tokens": 44907200} {"current_steps": 35475, "total_steps": 40000, "loss": 0.0748, "lr": 0.009377610434072004, "epoch": 1.7333447340776391, "percentage": 88.69, "elapsed_time": "1 day, 13:33:26", "remaining_time": "4:47:26", "throughput": 332.18, "total_tokens": 44913472} {"current_steps": 35480, "total_steps": 40000, "loss": 0.0484, "lr": 0.009357120491385167, "epoch": 1.7335890357413333, "percentage": 88.7, "elapsed_time": "1 day, 13:33:29", "remaining_time": "4:47:05", "throughput": 332.23, "total_tokens": 44920096} {"current_steps": 35485, "total_steps": 40000, "loss": 0.0851, "lr": 0.009336652237597743, "epoch": 1.7338333374050277, "percentage": 88.71, "elapsed_time": "1 day, 13:33:32", "remaining_time": "4:46:44", "throughput": 332.26, "total_tokens": 44926400} {"current_steps": 35490, "total_steps": 40000, "loss": 0.0458, "lr": 0.009316205675866251, "epoch": 1.734077639068722, "percentage": 88.72, "elapsed_time": "1 day, 13:33:35", "remaining_time": "4:46:22", "throughput": 332.3, "total_tokens": 44932416} {"current_steps": 35495, "total_steps": 40000, "loss": 0.0516, "lr": 0.00929578080934379, "epoch": 1.7343219407324164, "percentage": 88.74, "elapsed_time": "1 day, 13:33:38", "remaining_time": "4:46:01", "throughput": 332.34, "total_tokens": 44938912} {"current_steps": 35500, "total_steps": 40000, "loss": 0.061, "lr": 0.00927537764118012, "epoch": 1.7345662423961108, "percentage": 88.75, "elapsed_time": "1 day, 13:33:41", "remaining_time": "4:45:40", "throughput": 332.38, "total_tokens": 44945216} {"current_steps": 35505, "total_steps": 40000, "loss": 0.046, "lr": 0.009254996174521678, "epoch": 1.7348105440598052, "percentage": 88.76, "elapsed_time": "1 day, 13:33:45", "remaining_time": "4:45:19", "throughput": 332.42, "total_tokens": 44951584} {"current_steps": 35510, "total_steps": 40000, "loss": 0.0446, "lr": 0.009234636412511531, "epoch": 1.7350548457234993, "percentage": 88.78, "elapsed_time": "1 day, 13:33:48", "remaining_time": "4:44:58", "throughput": 332.46, "total_tokens": 44958016} {"current_steps": 35515, "total_steps": 40000, "loss": 0.0344, "lr": 0.009214298358289418, "epoch": 1.7352991473871937, "percentage": 88.79, "elapsed_time": "1 day, 13:33:51", "remaining_time": "4:44:37", "throughput": 332.5, "total_tokens": 44964224} {"current_steps": 35520, "total_steps": 40000, "loss": 0.0662, "lr": 0.00919398201499173, "epoch": 1.735543449050888, "percentage": 88.8, "elapsed_time": "1 day, 13:33:54", "remaining_time": "4:44:16", "throughput": 332.54, "total_tokens": 44970336} {"current_steps": 35525, "total_steps": 40000, "loss": 0.0729, "lr": 0.009173687385751495, "epoch": 1.7357877507145822, "percentage": 88.81, "elapsed_time": "1 day, 13:33:57", "remaining_time": "4:43:55", "throughput": 332.57, "total_tokens": 44976416} {"current_steps": 35530, "total_steps": 40000, "loss": 0.0782, "lr": 0.009153414473698407, "epoch": 1.7360320523782766, "percentage": 88.83, "elapsed_time": "1 day, 13:34:00", "remaining_time": "4:43:34", "throughput": 332.62, "total_tokens": 44983200} {"current_steps": 35535, "total_steps": 40000, "loss": 0.0681, "lr": 0.009133163281958784, "epoch": 1.736276354041971, "percentage": 88.84, "elapsed_time": "1 day, 13:34:03", "remaining_time": "4:43:13", "throughput": 332.66, "total_tokens": 44989696} {"current_steps": 35540, "total_steps": 40000, "loss": 0.0465, "lr": 0.009112933813655627, "epoch": 1.7365206557056654, "percentage": 88.85, "elapsed_time": "1 day, 13:34:06", "remaining_time": "4:42:52", "throughput": 332.7, "total_tokens": 44996384} {"current_steps": 35545, "total_steps": 40000, "loss": 0.0351, "lr": 0.009092726071908573, "epoch": 1.7367649573693598, "percentage": 88.86, "elapsed_time": "1 day, 13:34:09", "remaining_time": "4:42:31", "throughput": 332.74, "total_tokens": 45002688} {"current_steps": 35550, "total_steps": 40000, "loss": 0.0438, "lr": 0.0090725400598339, "epoch": 1.7370092590330541, "percentage": 88.88, "elapsed_time": "1 day, 13:34:12", "remaining_time": "4:42:10", "throughput": 332.78, "total_tokens": 45008800} {"current_steps": 35555, "total_steps": 40000, "loss": 0.0413, "lr": 0.009052375780544563, "epoch": 1.7372535606967483, "percentage": 88.89, "elapsed_time": "1 day, 13:34:15", "remaining_time": "4:41:49", "throughput": 332.81, "total_tokens": 45015008} {"current_steps": 35560, "total_steps": 40000, "loss": 0.0576, "lr": 0.009032233237150144, "epoch": 1.7374978623604427, "percentage": 88.9, "elapsed_time": "1 day, 13:34:18", "remaining_time": "4:41:28", "throughput": 332.85, "total_tokens": 45021312} {"current_steps": 35565, "total_steps": 40000, "loss": 0.0554, "lr": 0.009012112432756875, "epoch": 1.737742164024137, "percentage": 88.91, "elapsed_time": "1 day, 13:34:21", "remaining_time": "4:41:07", "throughput": 332.89, "total_tokens": 45027424} {"current_steps": 35570, "total_steps": 40000, "loss": 0.062, "lr": 0.008992013370467605, "epoch": 1.7379864656878312, "percentage": 88.92, "elapsed_time": "1 day, 13:34:25", "remaining_time": "4:40:46", "throughput": 332.93, "total_tokens": 45033760} {"current_steps": 35575, "total_steps": 40000, "loss": 0.0657, "lr": 0.008971936053381924, "epoch": 1.7382307673515256, "percentage": 88.94, "elapsed_time": "1 day, 13:34:28", "remaining_time": "4:40:25", "throughput": 332.97, "total_tokens": 45040032} {"current_steps": 35580, "total_steps": 40000, "loss": 0.065, "lr": 0.008951880484595953, "epoch": 1.73847506901522, "percentage": 88.95, "elapsed_time": "1 day, 13:34:31", "remaining_time": "4:40:04", "throughput": 333.01, "total_tokens": 45046464} {"current_steps": 35585, "total_steps": 40000, "loss": 0.0432, "lr": 0.008931846667202552, "epoch": 1.7387193706789144, "percentage": 88.96, "elapsed_time": "1 day, 13:34:34", "remaining_time": "4:39:43", "throughput": 333.05, "total_tokens": 45052992} {"current_steps": 35590, "total_steps": 40000, "loss": 0.0503, "lr": 0.008911834604291152, "epoch": 1.7389636723426087, "percentage": 88.98, "elapsed_time": "1 day, 13:34:37", "remaining_time": "4:39:22", "throughput": 333.09, "total_tokens": 45059520} {"current_steps": 35595, "total_steps": 40000, "loss": 0.0457, "lr": 0.008891844298947882, "epoch": 1.7392079740063031, "percentage": 88.99, "elapsed_time": "1 day, 13:34:40", "remaining_time": "4:39:01", "throughput": 333.13, "total_tokens": 45065888} {"current_steps": 35600, "total_steps": 40000, "loss": 0.0478, "lr": 0.008871875754255508, "epoch": 1.7394522756699973, "percentage": 89.0, "elapsed_time": "1 day, 13:34:43", "remaining_time": "4:38:40", "throughput": 333.17, "total_tokens": 45072416} {"current_steps": 35600, "total_steps": 40000, "eval_loss": 0.060643330216407776, "epoch": 1.7394522756699973, "percentage": 89.0, "elapsed_time": "1 day, 13:45:17", "remaining_time": "4:39:58", "throughput": 331.62, "total_tokens": 45072416} {"current_steps": 35605, "total_steps": 40000, "loss": 0.0777, "lr": 0.008851928973293422, "epoch": 1.7396965773336917, "percentage": 89.01, "elapsed_time": "1 day, 13:45:21", "remaining_time": "4:39:37", "throughput": 331.66, "total_tokens": 45078976} {"current_steps": 35610, "total_steps": 40000, "loss": 0.0707, "lr": 0.00883200395913764, "epoch": 1.7399408789973858, "percentage": 89.03, "elapsed_time": "1 day, 13:45:24", "remaining_time": "4:39:16", "throughput": 331.7, "total_tokens": 45085440} {"current_steps": 35615, "total_steps": 40000, "loss": 0.0558, "lr": 0.00881210071486091, "epoch": 1.7401851806610802, "percentage": 89.04, "elapsed_time": "1 day, 13:45:27", "remaining_time": "4:38:55", "throughput": 331.74, "total_tokens": 45092096} {"current_steps": 35620, "total_steps": 40000, "loss": 0.1021, "lr": 0.008792219243532505, "epoch": 1.7404294823247746, "percentage": 89.05, "elapsed_time": "1 day, 13:45:30", "remaining_time": "4:38:34", "throughput": 331.78, "total_tokens": 45098496} {"current_steps": 35625, "total_steps": 40000, "loss": 0.0476, "lr": 0.008772359548218428, "epoch": 1.740673783988469, "percentage": 89.06, "elapsed_time": "1 day, 13:45:33", "remaining_time": "4:38:13", "throughput": 331.82, "total_tokens": 45105024} {"current_steps": 35630, "total_steps": 40000, "loss": 0.0457, "lr": 0.008752521631981274, "epoch": 1.7409180856521633, "percentage": 89.08, "elapsed_time": "1 day, 13:45:36", "remaining_time": "4:37:52", "throughput": 331.86, "total_tokens": 45111424} {"current_steps": 35635, "total_steps": 40000, "loss": 0.0843, "lr": 0.008732705497880315, "epoch": 1.7411623873158577, "percentage": 89.09, "elapsed_time": "1 day, 13:45:39", "remaining_time": "4:37:31", "throughput": 331.9, "total_tokens": 45117760} {"current_steps": 35640, "total_steps": 40000, "loss": 0.0478, "lr": 0.008712911148971459, "epoch": 1.741406688979552, "percentage": 89.1, "elapsed_time": "1 day, 13:45:42", "remaining_time": "4:37:10", "throughput": 331.93, "total_tokens": 45124000} {"current_steps": 35645, "total_steps": 40000, "loss": 0.0561, "lr": 0.008693138588307208, "epoch": 1.7416509906432462, "percentage": 89.11, "elapsed_time": "1 day, 13:45:45", "remaining_time": "4:36:49", "throughput": 331.97, "total_tokens": 45130208} {"current_steps": 35650, "total_steps": 40000, "loss": 0.0468, "lr": 0.008673387818936762, "epoch": 1.7418952923069406, "percentage": 89.12, "elapsed_time": "1 day, 13:45:48", "remaining_time": "4:36:28", "throughput": 332.01, "total_tokens": 45136192} {"current_steps": 35655, "total_steps": 40000, "loss": 0.0511, "lr": 0.008653658843905948, "epoch": 1.7421395939706348, "percentage": 89.14, "elapsed_time": "1 day, 13:45:51", "remaining_time": "4:36:07", "throughput": 332.05, "total_tokens": 45142560} {"current_steps": 35660, "total_steps": 40000, "loss": 0.0524, "lr": 0.0086339516662572, "epoch": 1.7423838956343292, "percentage": 89.15, "elapsed_time": "1 day, 13:45:55", "remaining_time": "4:35:46", "throughput": 332.09, "total_tokens": 45148896} {"current_steps": 35665, "total_steps": 40000, "loss": 0.0542, "lr": 0.008614266289029638, "epoch": 1.7426281972980235, "percentage": 89.16, "elapsed_time": "1 day, 13:45:58", "remaining_time": "4:35:25", "throughput": 332.13, "total_tokens": 45155456} {"current_steps": 35670, "total_steps": 40000, "loss": 0.0634, "lr": 0.008594602715258965, "epoch": 1.742872498961718, "percentage": 89.18, "elapsed_time": "1 day, 13:46:01", "remaining_time": "4:35:04", "throughput": 332.17, "total_tokens": 45161696} {"current_steps": 35675, "total_steps": 40000, "loss": 0.0555, "lr": 0.008574960947977573, "epoch": 1.7431168006254123, "percentage": 89.19, "elapsed_time": "1 day, 13:46:04", "remaining_time": "4:34:43", "throughput": 332.21, "total_tokens": 45168640} {"current_steps": 35680, "total_steps": 40000, "loss": 0.0612, "lr": 0.008555340990214438, "epoch": 1.7433611022891067, "percentage": 89.2, "elapsed_time": "1 day, 13:46:07", "remaining_time": "4:34:22", "throughput": 332.25, "total_tokens": 45175136} {"current_steps": 35685, "total_steps": 40000, "loss": 0.0472, "lr": 0.008535742844995258, "epoch": 1.743605403952801, "percentage": 89.21, "elapsed_time": "1 day, 13:46:10", "remaining_time": "4:34:01", "throughput": 332.29, "total_tokens": 45181824} {"current_steps": 35690, "total_steps": 40000, "loss": 0.0658, "lr": 0.008516166515342266, "epoch": 1.7438497056164952, "percentage": 89.22, "elapsed_time": "1 day, 13:46:13", "remaining_time": "4:33:40", "throughput": 332.33, "total_tokens": 45188192} {"current_steps": 35695, "total_steps": 40000, "loss": 0.0557, "lr": 0.008496612004274411, "epoch": 1.7440940072801896, "percentage": 89.24, "elapsed_time": "1 day, 13:46:16", "remaining_time": "4:33:19", "throughput": 332.37, "total_tokens": 45194528} {"current_steps": 35700, "total_steps": 40000, "loss": 0.0504, "lr": 0.008477079314807201, "epoch": 1.7443383089438838, "percentage": 89.25, "elapsed_time": "1 day, 13:46:19", "remaining_time": "4:32:58", "throughput": 332.41, "total_tokens": 45201152} {"current_steps": 35705, "total_steps": 40000, "loss": 0.0529, "lr": 0.008457568449952874, "epoch": 1.7445826106075781, "percentage": 89.26, "elapsed_time": "1 day, 13:46:22", "remaining_time": "4:32:37", "throughput": 332.45, "total_tokens": 45207200} {"current_steps": 35710, "total_steps": 40000, "loss": 0.0528, "lr": 0.008438079412720189, "epoch": 1.7448269122712725, "percentage": 89.28, "elapsed_time": "1 day, 13:46:26", "remaining_time": "4:32:16", "throughput": 332.49, "total_tokens": 45213664} {"current_steps": 35715, "total_steps": 40000, "loss": 0.0465, "lr": 0.00841861220611466, "epoch": 1.745071213934967, "percentage": 89.29, "elapsed_time": "1 day, 13:46:29", "remaining_time": "4:31:55", "throughput": 332.53, "total_tokens": 45220416} {"current_steps": 35720, "total_steps": 40000, "loss": 0.0508, "lr": 0.008399166833138355, "epoch": 1.7453155155986613, "percentage": 89.3, "elapsed_time": "1 day, 13:46:32", "remaining_time": "4:31:34", "throughput": 332.57, "total_tokens": 45226656} {"current_steps": 35725, "total_steps": 40000, "loss": 0.0521, "lr": 0.008379743296789987, "epoch": 1.7455598172623557, "percentage": 89.31, "elapsed_time": "1 day, 13:46:35", "remaining_time": "4:31:13", "throughput": 332.61, "total_tokens": 45232864} {"current_steps": 35730, "total_steps": 40000, "loss": 0.0638, "lr": 0.008360341600064896, "epoch": 1.74580411892605, "percentage": 89.33, "elapsed_time": "1 day, 13:46:38", "remaining_time": "4:30:52", "throughput": 332.65, "total_tokens": 45239776} {"current_steps": 35735, "total_steps": 40000, "loss": 0.0291, "lr": 0.008340961745955121, "epoch": 1.7460484205897442, "percentage": 89.34, "elapsed_time": "1 day, 13:46:41", "remaining_time": "4:30:31", "throughput": 332.69, "total_tokens": 45246112} {"current_steps": 35740, "total_steps": 40000, "loss": 0.0462, "lr": 0.008321603737449224, "epoch": 1.7462927222534386, "percentage": 89.35, "elapsed_time": "1 day, 13:46:44", "remaining_time": "4:30:10", "throughput": 332.73, "total_tokens": 45252896} {"current_steps": 35745, "total_steps": 40000, "loss": 0.0369, "lr": 0.008302267577532479, "epoch": 1.7465370239171327, "percentage": 89.36, "elapsed_time": "1 day, 13:46:47", "remaining_time": "4:29:50", "throughput": 332.77, "total_tokens": 45259008} {"current_steps": 35750, "total_steps": 40000, "loss": 0.0325, "lr": 0.008282953269186771, "epoch": 1.746781325580827, "percentage": 89.38, "elapsed_time": "1 day, 13:46:50", "remaining_time": "4:29:29", "throughput": 332.81, "total_tokens": 45265408} {"current_steps": 35755, "total_steps": 40000, "loss": 0.042, "lr": 0.008263660815390567, "epoch": 1.7470256272445215, "percentage": 89.39, "elapsed_time": "1 day, 13:46:54", "remaining_time": "4:29:08", "throughput": 332.85, "total_tokens": 45271680} {"current_steps": 35760, "total_steps": 40000, "loss": 0.0488, "lr": 0.008244390219119069, "epoch": 1.7472699289082159, "percentage": 89.4, "elapsed_time": "1 day, 13:46:57", "remaining_time": "4:28:47", "throughput": 332.89, "total_tokens": 45278528} {"current_steps": 35765, "total_steps": 40000, "loss": 0.0504, "lr": 0.008225141483343967, "epoch": 1.7475142305719102, "percentage": 89.41, "elapsed_time": "1 day, 13:47:00", "remaining_time": "4:28:26", "throughput": 332.93, "total_tokens": 45284576} {"current_steps": 35770, "total_steps": 40000, "loss": 0.0588, "lr": 0.00820591461103372, "epoch": 1.7477585322356046, "percentage": 89.42, "elapsed_time": "1 day, 13:47:03", "remaining_time": "4:28:05", "throughput": 332.96, "total_tokens": 45290976} {"current_steps": 35775, "total_steps": 40000, "loss": 0.0288, "lr": 0.008186709605153358, "epoch": 1.748002833899299, "percentage": 89.44, "elapsed_time": "1 day, 13:47:06", "remaining_time": "4:27:44", "throughput": 333.0, "total_tokens": 45297344} {"current_steps": 35780, "total_steps": 40000, "loss": 0.0627, "lr": 0.008167526468664492, "epoch": 1.7482471355629932, "percentage": 89.45, "elapsed_time": "1 day, 13:47:09", "remaining_time": "4:27:23", "throughput": 333.04, "total_tokens": 45303936} {"current_steps": 35785, "total_steps": 40000, "loss": 0.0527, "lr": 0.008148365204525443, "epoch": 1.7484914372266875, "percentage": 89.46, "elapsed_time": "1 day, 13:47:12", "remaining_time": "4:27:02", "throughput": 333.09, "total_tokens": 45310528} {"current_steps": 35790, "total_steps": 40000, "loss": 0.0433, "lr": 0.00812922581569106, "epoch": 1.7487357388903817, "percentage": 89.48, "elapsed_time": "1 day, 13:47:15", "remaining_time": "4:26:41", "throughput": 333.13, "total_tokens": 45317440} {"current_steps": 35795, "total_steps": 40000, "loss": 0.0448, "lr": 0.008110108305112934, "epoch": 1.748980040554076, "percentage": 89.49, "elapsed_time": "1 day, 13:47:18", "remaining_time": "4:26:21", "throughput": 333.17, "total_tokens": 45323936} {"current_steps": 35800, "total_steps": 40000, "loss": 0.0743, "lr": 0.008091012675739223, "epoch": 1.7492243422177705, "percentage": 89.5, "elapsed_time": "1 day, 13:47:21", "remaining_time": "4:26:00", "throughput": 333.21, "total_tokens": 45330336} {"current_steps": 35800, "total_steps": 40000, "eval_loss": 0.06081436946988106, "epoch": 1.7492243422177705, "percentage": 89.5, "elapsed_time": "1 day, 13:57:55", "remaining_time": "4:27:14", "throughput": 331.66, "total_tokens": 45330336} {"current_steps": 35805, "total_steps": 40000, "loss": 0.0767, "lr": 0.008071938930514671, "epoch": 1.7494686438814648, "percentage": 89.51, "elapsed_time": "1 day, 13:57:59", "remaining_time": "4:26:53", "throughput": 331.7, "total_tokens": 45336896} {"current_steps": 35810, "total_steps": 40000, "loss": 0.0593, "lr": 0.008052887072380726, "epoch": 1.7497129455451592, "percentage": 89.53, "elapsed_time": "1 day, 13:58:02", "remaining_time": "4:26:32", "throughput": 331.74, "total_tokens": 45343296} {"current_steps": 35815, "total_steps": 40000, "loss": 0.0612, "lr": 0.008033857104275437, "epoch": 1.7499572472088536, "percentage": 89.54, "elapsed_time": "1 day, 13:58:06", "remaining_time": "4:26:11", "throughput": 331.78, "total_tokens": 45349728} {"current_steps": 35820, "total_steps": 40000, "loss": 0.0543, "lr": 0.008014849029133424, "epoch": 1.750201548872548, "percentage": 89.55, "elapsed_time": "1 day, 13:58:09", "remaining_time": "4:25:50", "throughput": 331.82, "total_tokens": 45355552} {"current_steps": 35825, "total_steps": 40000, "loss": 0.0654, "lr": 0.007995862849885975, "epoch": 1.7504458505362421, "percentage": 89.56, "elapsed_time": "1 day, 13:58:12", "remaining_time": "4:25:29", "throughput": 331.86, "total_tokens": 45361984} {"current_steps": 35830, "total_steps": 40000, "loss": 0.0861, "lr": 0.007976898569461032, "epoch": 1.7506901521999365, "percentage": 89.58, "elapsed_time": "1 day, 13:58:15", "remaining_time": "4:25:08", "throughput": 331.89, "total_tokens": 45367968} {"current_steps": 35835, "total_steps": 40000, "loss": 0.0486, "lr": 0.007957956190783088, "epoch": 1.7509344538636307, "percentage": 89.59, "elapsed_time": "1 day, 13:58:18", "remaining_time": "4:24:48", "throughput": 331.93, "total_tokens": 45374240} {"current_steps": 35840, "total_steps": 40000, "loss": 0.0597, "lr": 0.007939035716773324, "epoch": 1.751178755527325, "percentage": 89.6, "elapsed_time": "1 day, 13:58:21", "remaining_time": "4:24:27", "throughput": 331.97, "total_tokens": 45380608} {"current_steps": 35845, "total_steps": 40000, "loss": 0.0568, "lr": 0.007920137150349487, "epoch": 1.7514230571910194, "percentage": 89.61, "elapsed_time": "1 day, 13:58:24", "remaining_time": "4:24:06", "throughput": 332.01, "total_tokens": 45386912} {"current_steps": 35850, "total_steps": 40000, "loss": 0.0563, "lr": 0.007901260494425981, "epoch": 1.7516673588547138, "percentage": 89.62, "elapsed_time": "1 day, 13:58:27", "remaining_time": "4:23:45", "throughput": 332.05, "total_tokens": 45393312} {"current_steps": 35855, "total_steps": 40000, "loss": 0.0509, "lr": 0.007882405751913861, "epoch": 1.7519116605184082, "percentage": 89.64, "elapsed_time": "1 day, 13:58:30", "remaining_time": "4:23:24", "throughput": 332.09, "total_tokens": 45399712} {"current_steps": 35860, "total_steps": 40000, "loss": 0.0357, "lr": 0.007863572925720702, "epoch": 1.7521559621821026, "percentage": 89.65, "elapsed_time": "1 day, 13:58:33", "remaining_time": "4:23:03", "throughput": 332.13, "total_tokens": 45405984} {"current_steps": 35865, "total_steps": 40000, "loss": 0.1026, "lr": 0.007844762018750827, "epoch": 1.752400263845797, "percentage": 89.66, "elapsed_time": "1 day, 13:58:36", "remaining_time": "4:22:42", "throughput": 332.16, "total_tokens": 45411904} {"current_steps": 35870, "total_steps": 40000, "loss": 0.0562, "lr": 0.007825973033905054, "epoch": 1.752644565509491, "percentage": 89.68, "elapsed_time": "1 day, 13:58:39", "remaining_time": "4:22:21", "throughput": 332.2, "total_tokens": 45418656} {"current_steps": 35875, "total_steps": 40000, "loss": 0.0359, "lr": 0.007807205974080927, "epoch": 1.7528888671731855, "percentage": 89.69, "elapsed_time": "1 day, 13:58:42", "remaining_time": "4:22:00", "throughput": 332.24, "total_tokens": 45425280} {"current_steps": 35880, "total_steps": 40000, "loss": 0.077, "lr": 0.007788460842172551, "epoch": 1.7531331688368796, "percentage": 89.7, "elapsed_time": "1 day, 13:58:45", "remaining_time": "4:21:39", "throughput": 332.28, "total_tokens": 45431776} {"current_steps": 35885, "total_steps": 40000, "loss": 0.0481, "lr": 0.0077697376410706285, "epoch": 1.753377470500574, "percentage": 89.71, "elapsed_time": "1 day, 13:58:48", "remaining_time": "4:21:18", "throughput": 332.32, "total_tokens": 45438272} {"current_steps": 35890, "total_steps": 40000, "loss": 0.0646, "lr": 0.007751036373662567, "epoch": 1.7536217721642684, "percentage": 89.72, "elapsed_time": "1 day, 13:58:51", "remaining_time": "4:20:58", "throughput": 332.36, "total_tokens": 45444576} {"current_steps": 35895, "total_steps": 40000, "loss": 0.0907, "lr": 0.00773235704283231, "epoch": 1.7538660738279628, "percentage": 89.74, "elapsed_time": "1 day, 13:58:54", "remaining_time": "4:20:37", "throughput": 332.4, "total_tokens": 45450688} {"current_steps": 35900, "total_steps": 40000, "loss": 0.0433, "lr": 0.007713699651460437, "epoch": 1.7541103754916572, "percentage": 89.75, "elapsed_time": "1 day, 13:58:58", "remaining_time": "4:20:16", "throughput": 332.44, "total_tokens": 45457440} {"current_steps": 35905, "total_steps": 40000, "loss": 0.0561, "lr": 0.007695064202424162, "epoch": 1.7543546771553515, "percentage": 89.76, "elapsed_time": "1 day, 13:59:01", "remaining_time": "4:19:55", "throughput": 332.48, "total_tokens": 45463552} {"current_steps": 35910, "total_steps": 40000, "loss": 0.0509, "lr": 0.007676450698597286, "epoch": 1.754598978819046, "percentage": 89.78, "elapsed_time": "1 day, 13:59:04", "remaining_time": "4:19:34", "throughput": 332.52, "total_tokens": 45469984} {"current_steps": 35915, "total_steps": 40000, "loss": 0.0322, "lr": 0.007657859142850265, "epoch": 1.75484328048274, "percentage": 89.79, "elapsed_time": "1 day, 13:59:07", "remaining_time": "4:19:13", "throughput": 332.56, "total_tokens": 45476288} {"current_steps": 35920, "total_steps": 40000, "loss": 0.0508, "lr": 0.0076392895380501535, "epoch": 1.7550875821464345, "percentage": 89.8, "elapsed_time": "1 day, 13:59:10", "remaining_time": "4:18:52", "throughput": 332.6, "total_tokens": 45482784} {"current_steps": 35925, "total_steps": 40000, "loss": 0.0541, "lr": 0.007620741887060611, "epoch": 1.7553318838101286, "percentage": 89.81, "elapsed_time": "1 day, 13:59:13", "remaining_time": "4:18:32", "throughput": 332.64, "total_tokens": 45489088} {"current_steps": 35930, "total_steps": 40000, "loss": 0.0711, "lr": 0.007602216192741901, "epoch": 1.755576185473823, "percentage": 89.83, "elapsed_time": "1 day, 13:59:16", "remaining_time": "4:18:11", "throughput": 332.67, "total_tokens": 45495360} {"current_steps": 35935, "total_steps": 40000, "loss": 0.0412, "lr": 0.007583712457950969, "epoch": 1.7558204871375174, "percentage": 89.84, "elapsed_time": "1 day, 13:59:19", "remaining_time": "4:17:50", "throughput": 332.71, "total_tokens": 45501536} {"current_steps": 35940, "total_steps": 40000, "loss": 0.0516, "lr": 0.007565230685541269, "epoch": 1.7560647888012118, "percentage": 89.85, "elapsed_time": "1 day, 13:59:22", "remaining_time": "4:17:29", "throughput": 332.75, "total_tokens": 45507488} {"current_steps": 35945, "total_steps": 40000, "loss": 0.0906, "lr": 0.007546770878362968, "epoch": 1.7563090904649061, "percentage": 89.86, "elapsed_time": "1 day, 13:59:25", "remaining_time": "4:17:08", "throughput": 332.78, "total_tokens": 45513504} {"current_steps": 35950, "total_steps": 40000, "loss": 0.0474, "lr": 0.0075283330392627405, "epoch": 1.7565533921286005, "percentage": 89.88, "elapsed_time": "1 day, 13:59:28", "remaining_time": "4:16:47", "throughput": 332.82, "total_tokens": 45520032} {"current_steps": 35955, "total_steps": 40000, "loss": 0.0421, "lr": 0.007509917171083979, "epoch": 1.756797693792295, "percentage": 89.89, "elapsed_time": "1 day, 13:59:32", "remaining_time": "4:16:27", "throughput": 332.87, "total_tokens": 45527200} {"current_steps": 35960, "total_steps": 40000, "loss": 0.0651, "lr": 0.007491523276666662, "epoch": 1.757041995455989, "percentage": 89.9, "elapsed_time": "1 day, 13:59:35", "remaining_time": "4:16:06", "throughput": 332.91, "total_tokens": 45533376} {"current_steps": 35965, "total_steps": 40000, "loss": 0.062, "lr": 0.007473151358847318, "epoch": 1.7572862971196834, "percentage": 89.91, "elapsed_time": "1 day, 13:59:38", "remaining_time": "4:15:45", "throughput": 332.95, "total_tokens": 45539872} {"current_steps": 35970, "total_steps": 40000, "loss": 0.0498, "lr": 0.007454801420459117, "epoch": 1.7575305987833776, "percentage": 89.92, "elapsed_time": "1 day, 13:59:41", "remaining_time": "4:15:24", "throughput": 332.99, "total_tokens": 45546688} {"current_steps": 35975, "total_steps": 40000, "loss": 0.0495, "lr": 0.0074364734643319105, "epoch": 1.757774900447072, "percentage": 89.94, "elapsed_time": "1 day, 13:59:44", "remaining_time": "4:15:03", "throughput": 333.03, "total_tokens": 45553184} {"current_steps": 35980, "total_steps": 40000, "loss": 0.053, "lr": 0.007418167493292022, "epoch": 1.7580192021107663, "percentage": 89.95, "elapsed_time": "1 day, 13:59:47", "remaining_time": "4:14:43", "throughput": 333.07, "total_tokens": 45559904} {"current_steps": 35985, "total_steps": 40000, "loss": 0.0571, "lr": 0.0073998835101625245, "epoch": 1.7582635037744607, "percentage": 89.96, "elapsed_time": "1 day, 13:59:50", "remaining_time": "4:14:22", "throughput": 333.11, "total_tokens": 45565920} {"current_steps": 35990, "total_steps": 40000, "loss": 0.0463, "lr": 0.007381621517762998, "epoch": 1.758507805438155, "percentage": 89.98, "elapsed_time": "1 day, 13:59:53", "remaining_time": "4:14:01", "throughput": 333.14, "total_tokens": 45572000} {"current_steps": 35995, "total_steps": 40000, "loss": 0.0272, "lr": 0.007363381518909689, "epoch": 1.7587521071018495, "percentage": 89.99, "elapsed_time": "1 day, 13:59:56", "remaining_time": "4:13:40", "throughput": 333.18, "total_tokens": 45578368} {"current_steps": 36000, "total_steps": 40000, "loss": 0.053, "lr": 0.007345163516415448, "epoch": 1.7589964087655436, "percentage": 90.0, "elapsed_time": "1 day, 13:59:59", "remaining_time": "4:13:19", "throughput": 333.22, "total_tokens": 45584800} {"current_steps": 36000, "total_steps": 40000, "eval_loss": 0.06068667024374008, "epoch": 1.7589964087655436, "percentage": 90.0, "elapsed_time": "1 day, 14:10:34", "remaining_time": "4:14:30", "throughput": 331.68, "total_tokens": 45584800} {"current_steps": 36005, "total_steps": 40000, "loss": 0.0517, "lr": 0.007326967513089693, "epoch": 1.759240710429238, "percentage": 90.01, "elapsed_time": "1 day, 14:10:38", "remaining_time": "4:14:09", "throughput": 331.72, "total_tokens": 45591040} {"current_steps": 36010, "total_steps": 40000, "loss": 0.0455, "lr": 0.0073087935117384815, "epoch": 1.7594850120929324, "percentage": 90.03, "elapsed_time": "1 day, 14:10:41", "remaining_time": "4:13:48", "throughput": 331.76, "total_tokens": 45597152} {"current_steps": 36015, "total_steps": 40000, "loss": 0.0482, "lr": 0.007290641515164503, "epoch": 1.7597293137566266, "percentage": 90.04, "elapsed_time": "1 day, 14:10:44", "remaining_time": "4:13:27", "throughput": 331.8, "total_tokens": 45603360} {"current_steps": 36020, "total_steps": 40000, "loss": 0.0469, "lr": 0.007272511526166986, "epoch": 1.759973615420321, "percentage": 90.05, "elapsed_time": "1 day, 14:10:47", "remaining_time": "4:13:07", "throughput": 331.84, "total_tokens": 45610080} {"current_steps": 36025, "total_steps": 40000, "loss": 0.0694, "lr": 0.0072544035475418265, "epoch": 1.7602179170840153, "percentage": 90.06, "elapsed_time": "1 day, 14:10:50", "remaining_time": "4:12:46", "throughput": 331.87, "total_tokens": 45616384} {"current_steps": 36030, "total_steps": 40000, "loss": 0.0399, "lr": 0.007236317582081475, "epoch": 1.7604622187477097, "percentage": 90.08, "elapsed_time": "1 day, 14:10:53", "remaining_time": "4:12:25", "throughput": 331.91, "total_tokens": 45622880} {"current_steps": 36035, "total_steps": 40000, "loss": 0.0707, "lr": 0.007218253632575066, "epoch": 1.760706520411404, "percentage": 90.09, "elapsed_time": "1 day, 14:10:56", "remaining_time": "4:12:04", "throughput": 331.95, "total_tokens": 45629216} {"current_steps": 36040, "total_steps": 40000, "loss": 0.058, "lr": 0.007200211701808223, "epoch": 1.7609508220750985, "percentage": 90.1, "elapsed_time": "1 day, 14:10:59", "remaining_time": "4:11:43", "throughput": 331.99, "total_tokens": 45635392} {"current_steps": 36045, "total_steps": 40000, "loss": 0.0409, "lr": 0.007182191792563286, "epoch": 1.7611951237387926, "percentage": 90.11, "elapsed_time": "1 day, 14:11:02", "remaining_time": "4:11:22", "throughput": 332.03, "total_tokens": 45642080} {"current_steps": 36050, "total_steps": 40000, "loss": 0.0449, "lr": 0.0071641939076191145, "epoch": 1.761439425402487, "percentage": 90.12, "elapsed_time": "1 day, 14:11:05", "remaining_time": "4:11:02", "throughput": 332.07, "total_tokens": 45648224} {"current_steps": 36055, "total_steps": 40000, "loss": 0.0323, "lr": 0.007146218049751257, "epoch": 1.7616837270661814, "percentage": 90.14, "elapsed_time": "1 day, 14:11:09", "remaining_time": "4:10:41", "throughput": 332.11, "total_tokens": 45654848} {"current_steps": 36060, "total_steps": 40000, "loss": 0.0649, "lr": 0.0071282642217317775, "epoch": 1.7619280287298755, "percentage": 90.15, "elapsed_time": "1 day, 14:11:12", "remaining_time": "4:10:20", "throughput": 332.15, "total_tokens": 45661152} {"current_steps": 36065, "total_steps": 40000, "loss": 0.0766, "lr": 0.007110332426329396, "epoch": 1.76217233039357, "percentage": 90.16, "elapsed_time": "1 day, 14:11:15", "remaining_time": "4:09:59", "throughput": 332.19, "total_tokens": 45667200} {"current_steps": 36070, "total_steps": 40000, "loss": 0.0465, "lr": 0.007092422666309417, "epoch": 1.7624166320572643, "percentage": 90.18, "elapsed_time": "1 day, 14:11:18", "remaining_time": "4:09:38", "throughput": 332.23, "total_tokens": 45673952} {"current_steps": 36075, "total_steps": 40000, "loss": 0.0403, "lr": 0.0070745349444337295, "epoch": 1.7626609337209587, "percentage": 90.19, "elapsed_time": "1 day, 14:11:21", "remaining_time": "4:09:18", "throughput": 332.26, "total_tokens": 45680096} {"current_steps": 36080, "total_steps": 40000, "loss": 0.0486, "lr": 0.007056669263460913, "epoch": 1.762905235384653, "percentage": 90.2, "elapsed_time": "1 day, 14:11:24", "remaining_time": "4:08:57", "throughput": 332.3, "total_tokens": 45686240} {"current_steps": 36085, "total_steps": 40000, "loss": 0.0328, "lr": 0.007038825626145995, "epoch": 1.7631495370483474, "percentage": 90.21, "elapsed_time": "1 day, 14:11:27", "remaining_time": "4:08:36", "throughput": 332.34, "total_tokens": 45692832} {"current_steps": 36090, "total_steps": 40000, "loss": 0.0599, "lr": 0.007021004035240724, "epoch": 1.7633938387120416, "percentage": 90.22, "elapsed_time": "1 day, 14:11:30", "remaining_time": "4:08:15", "throughput": 332.38, "total_tokens": 45699200} {"current_steps": 36095, "total_steps": 40000, "loss": 0.0541, "lr": 0.007003204493493453, "epoch": 1.763638140375736, "percentage": 90.24, "elapsed_time": "1 day, 14:11:33", "remaining_time": "4:07:55", "throughput": 332.42, "total_tokens": 45705696} {"current_steps": 36100, "total_steps": 40000, "loss": 0.0524, "lr": 0.006985427003649036, "epoch": 1.7638824420394303, "percentage": 90.25, "elapsed_time": "1 day, 14:11:36", "remaining_time": "4:07:34", "throughput": 332.46, "total_tokens": 45711776} {"current_steps": 36105, "total_steps": 40000, "loss": 0.0343, "lr": 0.006967671568449013, "epoch": 1.7641267437031245, "percentage": 90.26, "elapsed_time": "1 day, 14:11:40", "remaining_time": "4:07:13", "throughput": 332.5, "total_tokens": 45718304} {"current_steps": 36110, "total_steps": 40000, "loss": 0.0565, "lr": 0.006949938190631511, "epoch": 1.7643710453668189, "percentage": 90.28, "elapsed_time": "1 day, 14:11:43", "remaining_time": "4:06:52", "throughput": 332.54, "total_tokens": 45724800} {"current_steps": 36115, "total_steps": 40000, "loss": 0.0427, "lr": 0.0069322268729311905, "epoch": 1.7646153470305133, "percentage": 90.29, "elapsed_time": "1 day, 14:11:46", "remaining_time": "4:06:31", "throughput": 332.58, "total_tokens": 45732128} {"current_steps": 36120, "total_steps": 40000, "loss": 0.0496, "lr": 0.006914537618079403, "epoch": 1.7648596486942076, "percentage": 90.3, "elapsed_time": "1 day, 14:11:49", "remaining_time": "4:06:11", "throughput": 332.62, "total_tokens": 45738016} {"current_steps": 36125, "total_steps": 40000, "loss": 0.0729, "lr": 0.006896870428804031, "epoch": 1.765103950357902, "percentage": 90.31, "elapsed_time": "1 day, 14:11:52", "remaining_time": "4:05:50", "throughput": 332.66, "total_tokens": 45744800} {"current_steps": 36130, "total_steps": 40000, "loss": 0.0642, "lr": 0.006879225307829595, "epoch": 1.7653482520215964, "percentage": 90.33, "elapsed_time": "1 day, 14:11:55", "remaining_time": "4:05:29", "throughput": 332.7, "total_tokens": 45751360} {"current_steps": 36135, "total_steps": 40000, "loss": 0.0554, "lr": 0.00686160225787717, "epoch": 1.7655925536852906, "percentage": 90.34, "elapsed_time": "1 day, 14:11:58", "remaining_time": "4:05:09", "throughput": 332.73, "total_tokens": 45757120} {"current_steps": 36140, "total_steps": 40000, "loss": 0.0355, "lr": 0.006844001281664463, "epoch": 1.765836855348985, "percentage": 90.35, "elapsed_time": "1 day, 14:12:01", "remaining_time": "4:04:48", "throughput": 332.77, "total_tokens": 45763808} {"current_steps": 36145, "total_steps": 40000, "loss": 0.0459, "lr": 0.006826422381905789, "epoch": 1.766081157012679, "percentage": 90.36, "elapsed_time": "1 day, 14:12:04", "remaining_time": "4:04:27", "throughput": 332.81, "total_tokens": 45770304} {"current_steps": 36150, "total_steps": 40000, "loss": 0.0663, "lr": 0.006808865561311994, "epoch": 1.7663254586763735, "percentage": 90.38, "elapsed_time": "1 day, 14:12:07", "remaining_time": "4:04:06", "throughput": 332.85, "total_tokens": 45776576} {"current_steps": 36155, "total_steps": 40000, "loss": 0.0681, "lr": 0.00679133082259058, "epoch": 1.7665697603400679, "percentage": 90.39, "elapsed_time": "1 day, 14:12:11", "remaining_time": "4:03:46", "throughput": 332.89, "total_tokens": 45783104} {"current_steps": 36160, "total_steps": 40000, "loss": 0.0647, "lr": 0.00677381816844565, "epoch": 1.7668140620037622, "percentage": 90.4, "elapsed_time": "1 day, 14:12:14", "remaining_time": "4:03:25", "throughput": 332.93, "total_tokens": 45789216} {"current_steps": 36165, "total_steps": 40000, "loss": 0.0581, "lr": 0.0067563276015778434, "epoch": 1.7670583636674566, "percentage": 90.41, "elapsed_time": "1 day, 14:12:17", "remaining_time": "4:03:04", "throughput": 332.97, "total_tokens": 45795904} {"current_steps": 36170, "total_steps": 40000, "loss": 0.0403, "lr": 0.006738859124684437, "epoch": 1.767302665331151, "percentage": 90.42, "elapsed_time": "1 day, 14:12:20", "remaining_time": "4:02:43", "throughput": 333.01, "total_tokens": 45801920} {"current_steps": 36175, "total_steps": 40000, "loss": 0.0758, "lr": 0.006721412740459259, "epoch": 1.7675469669948454, "percentage": 90.44, "elapsed_time": "1 day, 14:12:23", "remaining_time": "4:02:23", "throughput": 333.04, "total_tokens": 45807872} {"current_steps": 36180, "total_steps": 40000, "loss": 0.0523, "lr": 0.006703988451592824, "epoch": 1.7677912686585395, "percentage": 90.45, "elapsed_time": "1 day, 14:12:26", "remaining_time": "4:02:02", "throughput": 333.08, "total_tokens": 45813664} {"current_steps": 36185, "total_steps": 40000, "loss": 0.0584, "lr": 0.006686586260772114, "epoch": 1.768035570322234, "percentage": 90.46, "elapsed_time": "1 day, 14:12:29", "remaining_time": "4:01:41", "throughput": 333.12, "total_tokens": 45820064} {"current_steps": 36190, "total_steps": 40000, "loss": 0.0899, "lr": 0.006669206170680819, "epoch": 1.768279871985928, "percentage": 90.48, "elapsed_time": "1 day, 14:12:32", "remaining_time": "4:01:21", "throughput": 333.16, "total_tokens": 45826752} {"current_steps": 36195, "total_steps": 40000, "loss": 0.0682, "lr": 0.0066518481839991095, "epoch": 1.7685241736496224, "percentage": 90.49, "elapsed_time": "1 day, 14:12:35", "remaining_time": "4:01:00", "throughput": 333.2, "total_tokens": 45832992} {"current_steps": 36200, "total_steps": 40000, "loss": 0.0727, "lr": 0.006634512303403861, "epoch": 1.7687684753133168, "percentage": 90.5, "elapsed_time": "1 day, 14:12:38", "remaining_time": "4:00:39", "throughput": 333.23, "total_tokens": 45838848} {"current_steps": 36200, "total_steps": 40000, "eval_loss": 0.06062329560518265, "epoch": 1.7687684753133168, "percentage": 90.5, "elapsed_time": "1 day, 14:23:12", "remaining_time": "4:01:46", "throughput": 331.7, "total_tokens": 45838848} {"current_steps": 36205, "total_steps": 40000, "loss": 0.0446, "lr": 0.0066171985315684355, "epoch": 1.7690127769770112, "percentage": 90.51, "elapsed_time": "1 day, 14:23:16", "remaining_time": "4:01:25", "throughput": 331.74, "total_tokens": 45844832} {"current_steps": 36210, "total_steps": 40000, "loss": 0.0648, "lr": 0.0065999068711628806, "epoch": 1.7692570786407056, "percentage": 90.53, "elapsed_time": "1 day, 14:23:19", "remaining_time": "4:01:04", "throughput": 331.78, "total_tokens": 45851360} {"current_steps": 36215, "total_steps": 40000, "loss": 0.0669, "lr": 0.0065826373248537295, "epoch": 1.7695013803044, "percentage": 90.54, "elapsed_time": "1 day, 14:23:22", "remaining_time": "4:00:44", "throughput": 331.82, "total_tokens": 45857952} {"current_steps": 36220, "total_steps": 40000, "loss": 0.0354, "lr": 0.006565389895304218, "epoch": 1.7697456819680943, "percentage": 90.55, "elapsed_time": "1 day, 14:23:26", "remaining_time": "4:00:23", "throughput": 331.86, "total_tokens": 45864608} {"current_steps": 36225, "total_steps": 40000, "loss": 0.043, "lr": 0.006548164585174104, "epoch": 1.7699899836317885, "percentage": 90.56, "elapsed_time": "1 day, 14:23:29", "remaining_time": "4:00:02", "throughput": 331.89, "total_tokens": 45870816} {"current_steps": 36230, "total_steps": 40000, "loss": 0.038, "lr": 0.006530961397119728, "epoch": 1.7702342852954829, "percentage": 90.58, "elapsed_time": "1 day, 14:23:32", "remaining_time": "3:59:42", "throughput": 331.93, "total_tokens": 45877152} {"current_steps": 36235, "total_steps": 40000, "loss": 0.0635, "lr": 0.00651378033379405, "epoch": 1.770478586959177, "percentage": 90.59, "elapsed_time": "1 day, 14:23:35", "remaining_time": "3:59:21", "throughput": 331.97, "total_tokens": 45883488} {"current_steps": 36240, "total_steps": 40000, "loss": 0.0501, "lr": 0.006496621397846619, "epoch": 1.7707228886228714, "percentage": 90.6, "elapsed_time": "1 day, 14:23:38", "remaining_time": "3:59:00", "throughput": 332.01, "total_tokens": 45889696} {"current_steps": 36245, "total_steps": 40000, "loss": 0.0429, "lr": 0.006479484591923518, "epoch": 1.7709671902865658, "percentage": 90.61, "elapsed_time": "1 day, 14:23:41", "remaining_time": "3:58:39", "throughput": 332.05, "total_tokens": 45896064} {"current_steps": 36250, "total_steps": 40000, "loss": 0.0624, "lr": 0.006462369918667515, "epoch": 1.7712114919502602, "percentage": 90.62, "elapsed_time": "1 day, 14:23:44", "remaining_time": "3:58:19", "throughput": 332.09, "total_tokens": 45902848} {"current_steps": 36255, "total_steps": 40000, "loss": 0.0907, "lr": 0.006445277380717851, "epoch": 1.7714557936139546, "percentage": 90.64, "elapsed_time": "1 day, 14:23:47", "remaining_time": "3:57:58", "throughput": 332.13, "total_tokens": 45908992} {"current_steps": 36260, "total_steps": 40000, "loss": 0.0656, "lr": 0.006428206980710466, "epoch": 1.771700095277649, "percentage": 90.65, "elapsed_time": "1 day, 14:23:50", "remaining_time": "3:57:37", "throughput": 332.16, "total_tokens": 45915104} {"current_steps": 36265, "total_steps": 40000, "loss": 0.0705, "lr": 0.006411158721277788, "epoch": 1.7719443969413433, "percentage": 90.66, "elapsed_time": "1 day, 14:23:53", "remaining_time": "3:57:16", "throughput": 332.2, "total_tokens": 45920704} {"current_steps": 36270, "total_steps": 40000, "loss": 0.0624, "lr": 0.00639413260504888, "epoch": 1.7721886986050375, "percentage": 90.67, "elapsed_time": "1 day, 14:23:56", "remaining_time": "3:56:56", "throughput": 332.24, "total_tokens": 45927264} {"current_steps": 36275, "total_steps": 40000, "loss": 0.0591, "lr": 0.006377128634649376, "epoch": 1.7724330002687319, "percentage": 90.69, "elapsed_time": "1 day, 14:23:59", "remaining_time": "3:56:35", "throughput": 332.27, "total_tokens": 45933312} {"current_steps": 36280, "total_steps": 40000, "loss": 0.0474, "lr": 0.006360146812701528, "epoch": 1.772677301932426, "percentage": 90.7, "elapsed_time": "1 day, 14:24:02", "remaining_time": "3:56:14", "throughput": 332.31, "total_tokens": 45939456} {"current_steps": 36285, "total_steps": 40000, "loss": 0.0574, "lr": 0.006343187141824125, "epoch": 1.7729216035961204, "percentage": 90.71, "elapsed_time": "1 day, 14:24:05", "remaining_time": "3:55:54", "throughput": 332.35, "total_tokens": 45946656} {"current_steps": 36290, "total_steps": 40000, "loss": 0.0276, "lr": 0.00632624962463259, "epoch": 1.7731659052598148, "percentage": 90.72, "elapsed_time": "1 day, 14:24:08", "remaining_time": "3:55:33", "throughput": 332.39, "total_tokens": 45953024} {"current_steps": 36295, "total_steps": 40000, "loss": 0.0568, "lr": 0.006309334263738853, "epoch": 1.7734102069235091, "percentage": 90.74, "elapsed_time": "1 day, 14:24:12", "remaining_time": "3:55:12", "throughput": 332.43, "total_tokens": 45959584} {"current_steps": 36300, "total_steps": 40000, "loss": 0.0408, "lr": 0.006292441061751508, "epoch": 1.7736545085872035, "percentage": 90.75, "elapsed_time": "1 day, 14:24:15", "remaining_time": "3:54:52", "throughput": 332.47, "total_tokens": 45965824} {"current_steps": 36305, "total_steps": 40000, "loss": 0.0511, "lr": 0.0062755700212757054, "epoch": 1.773898810250898, "percentage": 90.76, "elapsed_time": "1 day, 14:24:18", "remaining_time": "3:54:31", "throughput": 332.51, "total_tokens": 45971904} {"current_steps": 36310, "total_steps": 40000, "loss": 0.0614, "lr": 0.006258721144913148, "epoch": 1.7741431119145923, "percentage": 90.77, "elapsed_time": "1 day, 14:24:21", "remaining_time": "3:54:10", "throughput": 332.55, "total_tokens": 45978368} {"current_steps": 36315, "total_steps": 40000, "loss": 0.0591, "lr": 0.0062418944352621575, "epoch": 1.7743874135782864, "percentage": 90.79, "elapsed_time": "1 day, 14:24:24", "remaining_time": "3:53:50", "throughput": 332.58, "total_tokens": 45984512} {"current_steps": 36320, "total_steps": 40000, "loss": 0.0501, "lr": 0.0062250898949176405, "epoch": 1.7746317152419808, "percentage": 90.8, "elapsed_time": "1 day, 14:24:27", "remaining_time": "3:53:29", "throughput": 332.62, "total_tokens": 45990624} {"current_steps": 36325, "total_steps": 40000, "loss": 0.0579, "lr": 0.006208307526471041, "epoch": 1.774876016905675, "percentage": 90.81, "elapsed_time": "1 day, 14:24:30", "remaining_time": "3:53:08", "throughput": 332.66, "total_tokens": 45996832} {"current_steps": 36330, "total_steps": 40000, "loss": 0.0632, "lr": 0.006191547332510405, "epoch": 1.7751203185693694, "percentage": 90.83, "elapsed_time": "1 day, 14:24:33", "remaining_time": "3:52:48", "throughput": 332.7, "total_tokens": 46003008} {"current_steps": 36335, "total_steps": 40000, "loss": 0.0366, "lr": 0.006174809315620416, "epoch": 1.7753646202330637, "percentage": 90.84, "elapsed_time": "1 day, 14:24:36", "remaining_time": "3:52:27", "throughput": 332.73, "total_tokens": 46009120} {"current_steps": 36340, "total_steps": 40000, "loss": 0.0605, "lr": 0.00615809347838221, "epoch": 1.7756089218967581, "percentage": 90.85, "elapsed_time": "1 day, 14:24:39", "remaining_time": "3:52:06", "throughput": 332.77, "total_tokens": 46015552} {"current_steps": 36345, "total_steps": 40000, "loss": 0.0617, "lr": 0.006141399823373655, "epoch": 1.7758532235604525, "percentage": 90.86, "elapsed_time": "1 day, 14:24:42", "remaining_time": "3:51:46", "throughput": 332.81, "total_tokens": 46022016} {"current_steps": 36350, "total_steps": 40000, "loss": 0.0485, "lr": 0.0061247283531690455, "epoch": 1.7760975252241469, "percentage": 90.88, "elapsed_time": "1 day, 14:24:45", "remaining_time": "3:51:25", "throughput": 332.85, "total_tokens": 46027968} {"current_steps": 36355, "total_steps": 40000, "loss": 0.0585, "lr": 0.0061080790703393895, "epoch": 1.7763418268878413, "percentage": 90.89, "elapsed_time": "1 day, 14:24:48", "remaining_time": "3:51:05", "throughput": 332.89, "total_tokens": 46034304} {"current_steps": 36360, "total_steps": 40000, "loss": 0.0721, "lr": 0.006091451977452217, "epoch": 1.7765861285515354, "percentage": 90.9, "elapsed_time": "1 day, 14:24:51", "remaining_time": "3:50:44", "throughput": 332.92, "total_tokens": 46040768} {"current_steps": 36365, "total_steps": 40000, "loss": 0.0473, "lr": 0.00607484707707161, "epoch": 1.7768304302152298, "percentage": 90.91, "elapsed_time": "1 day, 14:24:54", "remaining_time": "3:50:23", "throughput": 332.96, "total_tokens": 46047360} {"current_steps": 36370, "total_steps": 40000, "loss": 0.0973, "lr": 0.006058264371758254, "epoch": 1.777074731878924, "percentage": 90.92, "elapsed_time": "1 day, 14:24:58", "remaining_time": "3:50:03", "throughput": 333.0, "total_tokens": 46053728} {"current_steps": 36375, "total_steps": 40000, "loss": 0.0591, "lr": 0.00604170386406942, "epoch": 1.7773190335426183, "percentage": 90.94, "elapsed_time": "1 day, 14:25:01", "remaining_time": "3:49:42", "throughput": 333.04, "total_tokens": 46059712} {"current_steps": 36380, "total_steps": 40000, "loss": 0.0671, "lr": 0.006025165556558931, "epoch": 1.7775633352063127, "percentage": 90.95, "elapsed_time": "1 day, 14:25:04", "remaining_time": "3:49:21", "throughput": 333.08, "total_tokens": 46065856} {"current_steps": 36385, "total_steps": 40000, "loss": 0.0759, "lr": 0.006008649451777248, "epoch": 1.777807636870007, "percentage": 90.96, "elapsed_time": "1 day, 14:25:07", "remaining_time": "3:49:01", "throughput": 333.11, "total_tokens": 46071616} {"current_steps": 36390, "total_steps": 40000, "loss": 0.0522, "lr": 0.005992155552271283, "epoch": 1.7780519385337015, "percentage": 90.97, "elapsed_time": "1 day, 14:25:10", "remaining_time": "3:48:40", "throughput": 333.15, "total_tokens": 46077792} {"current_steps": 36395, "total_steps": 40000, "loss": 0.0619, "lr": 0.005975683860584685, "epoch": 1.7782962401973958, "percentage": 90.99, "elapsed_time": "1 day, 14:25:13", "remaining_time": "3:48:20", "throughput": 333.19, "total_tokens": 46084384} {"current_steps": 36400, "total_steps": 40000, "loss": 0.0583, "lr": 0.0059592343792575385, "epoch": 1.7785405418610902, "percentage": 91.0, "elapsed_time": "1 day, 14:25:16", "remaining_time": "3:47:59", "throughput": 333.23, "total_tokens": 46091136} {"current_steps": 36400, "total_steps": 40000, "eval_loss": 0.060653794556856155, "epoch": 1.7785405418610902, "percentage": 91.0, "elapsed_time": "1 day, 14:35:50", "remaining_time": "3:49:02", "throughput": 331.71, "total_tokens": 46091136} {"current_steps": 36405, "total_steps": 40000, "loss": 0.0432, "lr": 0.0059428071108265975, "epoch": 1.7787848435247844, "percentage": 91.01, "elapsed_time": "1 day, 14:35:53", "remaining_time": "3:48:41", "throughput": 331.74, "total_tokens": 46097088} {"current_steps": 36410, "total_steps": 40000, "loss": 0.0597, "lr": 0.005926402057825136, "epoch": 1.7790291451884788, "percentage": 91.03, "elapsed_time": "1 day, 14:35:56", "remaining_time": "3:48:21", "throughput": 331.78, "total_tokens": 46103296} {"current_steps": 36415, "total_steps": 40000, "loss": 0.0416, "lr": 0.005910019222782997, "epoch": 1.779273446852173, "percentage": 91.04, "elapsed_time": "1 day, 14:36:00", "remaining_time": "3:48:00", "throughput": 331.82, "total_tokens": 46109728} {"current_steps": 36420, "total_steps": 40000, "loss": 0.053, "lr": 0.005893658608226643, "epoch": 1.7795177485158673, "percentage": 91.05, "elapsed_time": "1 day, 14:36:03", "remaining_time": "3:47:39", "throughput": 331.86, "total_tokens": 46115872} {"current_steps": 36425, "total_steps": 40000, "loss": 0.0471, "lr": 0.0058773202166791045, "epoch": 1.7797620501795617, "percentage": 91.06, "elapsed_time": "1 day, 14:36:06", "remaining_time": "3:47:19", "throughput": 331.9, "total_tokens": 46122176} {"current_steps": 36430, "total_steps": 40000, "loss": 0.0429, "lr": 0.005861004050659918, "epoch": 1.780006351843256, "percentage": 91.07, "elapsed_time": "1 day, 14:36:09", "remaining_time": "3:46:58", "throughput": 331.93, "total_tokens": 46128352} {"current_steps": 36435, "total_steps": 40000, "loss": 0.0558, "lr": 0.005844710112685286, "epoch": 1.7802506535069504, "percentage": 91.09, "elapsed_time": "1 day, 14:36:12", "remaining_time": "3:46:37", "throughput": 331.97, "total_tokens": 46134752} {"current_steps": 36440, "total_steps": 40000, "loss": 0.0433, "lr": 0.005828438405267933, "epoch": 1.7804949551706448, "percentage": 91.1, "elapsed_time": "1 day, 14:36:15", "remaining_time": "3:46:17", "throughput": 332.01, "total_tokens": 46141312} {"current_steps": 36445, "total_steps": 40000, "loss": 0.0364, "lr": 0.00581218893091715, "epoch": 1.7807392568343392, "percentage": 91.11, "elapsed_time": "1 day, 14:36:18", "remaining_time": "3:45:56", "throughput": 332.05, "total_tokens": 46147424} {"current_steps": 36450, "total_steps": 40000, "loss": 0.0692, "lr": 0.005795961692138801, "epoch": 1.7809835584980334, "percentage": 91.12, "elapsed_time": "1 day, 14:36:21", "remaining_time": "3:45:35", "throughput": 332.09, "total_tokens": 46153760} {"current_steps": 36455, "total_steps": 40000, "loss": 0.0626, "lr": 0.00577975669143535, "epoch": 1.7812278601617277, "percentage": 91.14, "elapsed_time": "1 day, 14:36:24", "remaining_time": "3:45:15", "throughput": 332.12, "total_tokens": 46160224} {"current_steps": 36460, "total_steps": 40000, "loss": 0.0627, "lr": 0.005763573931305782, "epoch": 1.781472161825422, "percentage": 91.15, "elapsed_time": "1 day, 14:36:27", "remaining_time": "3:44:54", "throughput": 332.16, "total_tokens": 46166624} {"current_steps": 36465, "total_steps": 40000, "loss": 0.0587, "lr": 0.005747413414245733, "epoch": 1.7817164634891163, "percentage": 91.16, "elapsed_time": "1 day, 14:36:30", "remaining_time": "3:44:34", "throughput": 332.2, "total_tokens": 46172672} {"current_steps": 36470, "total_steps": 40000, "loss": 0.0613, "lr": 0.005731275142747294, "epoch": 1.7819607651528107, "percentage": 91.17, "elapsed_time": "1 day, 14:36:33", "remaining_time": "3:44:13", "throughput": 332.24, "total_tokens": 46178784} {"current_steps": 36475, "total_steps": 40000, "loss": 0.042, "lr": 0.005715159119299256, "epoch": 1.782205066816505, "percentage": 91.19, "elapsed_time": "1 day, 14:36:36", "remaining_time": "3:43:52", "throughput": 332.28, "total_tokens": 46185280} {"current_steps": 36480, "total_steps": 40000, "loss": 0.0558, "lr": 0.005699065346386867, "epoch": 1.7824493684801994, "percentage": 91.2, "elapsed_time": "1 day, 14:36:39", "remaining_time": "3:43:32", "throughput": 332.31, "total_tokens": 46191584} {"current_steps": 36485, "total_steps": 40000, "loss": 0.0586, "lr": 0.0056829938264919885, "epoch": 1.7826936701438938, "percentage": 91.21, "elapsed_time": "1 day, 14:36:42", "remaining_time": "3:43:11", "throughput": 332.36, "total_tokens": 46198400} {"current_steps": 36490, "total_steps": 40000, "loss": 0.0832, "lr": 0.005666944562093074, "epoch": 1.7829379718075882, "percentage": 91.22, "elapsed_time": "1 day, 14:36:46", "remaining_time": "3:42:51", "throughput": 332.39, "total_tokens": 46204832} {"current_steps": 36495, "total_steps": 40000, "loss": 0.0787, "lr": 0.005650917555665108, "epoch": 1.7831822734712823, "percentage": 91.24, "elapsed_time": "1 day, 14:36:49", "remaining_time": "3:42:30", "throughput": 332.43, "total_tokens": 46210976} {"current_steps": 36500, "total_steps": 40000, "loss": 0.0664, "lr": 0.005634912809679632, "epoch": 1.7834265751349767, "percentage": 91.25, "elapsed_time": "1 day, 14:36:52", "remaining_time": "3:42:09", "throughput": 332.47, "total_tokens": 46217440} {"current_steps": 36505, "total_steps": 40000, "loss": 0.067, "lr": 0.005618930326604854, "epoch": 1.7836708767986709, "percentage": 91.26, "elapsed_time": "1 day, 14:36:55", "remaining_time": "3:41:49", "throughput": 332.5, "total_tokens": 46223072} {"current_steps": 36510, "total_steps": 40000, "loss": 0.0812, "lr": 0.005602970108905386, "epoch": 1.7839151784623652, "percentage": 91.27, "elapsed_time": "1 day, 14:36:58", "remaining_time": "3:41:28", "throughput": 332.54, "total_tokens": 46229472} {"current_steps": 36515, "total_steps": 40000, "loss": 0.0512, "lr": 0.005587032159042543, "epoch": 1.7841594801260596, "percentage": 91.29, "elapsed_time": "1 day, 14:37:01", "remaining_time": "3:41:08", "throughput": 332.58, "total_tokens": 46236096} {"current_steps": 36520, "total_steps": 40000, "loss": 0.0408, "lr": 0.005571116479474158, "epoch": 1.784403781789754, "percentage": 91.3, "elapsed_time": "1 day, 14:37:04", "remaining_time": "3:40:47", "throughput": 332.62, "total_tokens": 46242560} {"current_steps": 36525, "total_steps": 40000, "loss": 0.0245, "lr": 0.005555223072654619, "epoch": 1.7846480834534484, "percentage": 91.31, "elapsed_time": "1 day, 14:37:07", "remaining_time": "3:40:27", "throughput": 332.66, "total_tokens": 46249024} {"current_steps": 36530, "total_steps": 40000, "loss": 0.0725, "lr": 0.005539351941034881, "epoch": 1.7848923851171428, "percentage": 91.33, "elapsed_time": "1 day, 14:37:10", "remaining_time": "3:40:06", "throughput": 332.7, "total_tokens": 46255936} {"current_steps": 36535, "total_steps": 40000, "loss": 0.0542, "lr": 0.0055235030870624865, "epoch": 1.785136686780837, "percentage": 91.34, "elapsed_time": "1 day, 14:37:13", "remaining_time": "3:39:46", "throughput": 332.74, "total_tokens": 46262336} {"current_steps": 36540, "total_steps": 40000, "loss": 0.0695, "lr": 0.005507676513181514, "epoch": 1.7853809884445313, "percentage": 91.35, "elapsed_time": "1 day, 14:37:16", "remaining_time": "3:39:25", "throughput": 332.78, "total_tokens": 46268736} {"current_steps": 36545, "total_steps": 40000, "loss": 0.0665, "lr": 0.005491872221832628, "epoch": 1.7856252901082257, "percentage": 91.36, "elapsed_time": "1 day, 14:37:19", "remaining_time": "3:39:04", "throughput": 332.82, "total_tokens": 46275040} {"current_steps": 36550, "total_steps": 40000, "loss": 0.0399, "lr": 0.005476090215453061, "epoch": 1.7858695917719198, "percentage": 91.38, "elapsed_time": "1 day, 14:37:23", "remaining_time": "3:38:44", "throughput": 332.86, "total_tokens": 46281472} {"current_steps": 36555, "total_steps": 40000, "loss": 0.059, "lr": 0.0054603304964765675, "epoch": 1.7861138934356142, "percentage": 91.39, "elapsed_time": "1 day, 14:37:26", "remaining_time": "3:38:23", "throughput": 332.89, "total_tokens": 46287680} {"current_steps": 36560, "total_steps": 40000, "loss": 0.0439, "lr": 0.005444593067333519, "epoch": 1.7863581950993086, "percentage": 91.4, "elapsed_time": "1 day, 14:37:29", "remaining_time": "3:38:03", "throughput": 332.93, "total_tokens": 46293856} {"current_steps": 36565, "total_steps": 40000, "loss": 0.0473, "lr": 0.00542887793045081, "epoch": 1.786602496763003, "percentage": 91.41, "elapsed_time": "1 day, 14:37:32", "remaining_time": "3:37:42", "throughput": 332.97, "total_tokens": 46300416} {"current_steps": 36570, "total_steps": 40000, "loss": 0.0528, "lr": 0.005413185088251932, "epoch": 1.7868467984266974, "percentage": 91.42, "elapsed_time": "1 day, 14:37:35", "remaining_time": "3:37:22", "throughput": 333.01, "total_tokens": 46306720} {"current_steps": 36575, "total_steps": 40000, "loss": 0.0478, "lr": 0.005397514543156884, "epoch": 1.7870911000903917, "percentage": 91.44, "elapsed_time": "1 day, 14:37:38", "remaining_time": "3:37:01", "throughput": 333.05, "total_tokens": 46312672} {"current_steps": 36580, "total_steps": 40000, "loss": 0.0641, "lr": 0.0053818662975822825, "epoch": 1.787335401754086, "percentage": 91.45, "elapsed_time": "1 day, 14:37:41", "remaining_time": "3:36:41", "throughput": 333.08, "total_tokens": 46319008} {"current_steps": 36585, "total_steps": 40000, "loss": 0.0729, "lr": 0.005366240353941315, "epoch": 1.7875797034177803, "percentage": 91.46, "elapsed_time": "1 day, 14:37:44", "remaining_time": "3:36:20", "throughput": 333.12, "total_tokens": 46325376} {"current_steps": 36590, "total_steps": 40000, "loss": 0.0413, "lr": 0.005350636714643636, "epoch": 1.7878240050814747, "percentage": 91.47, "elapsed_time": "1 day, 14:37:47", "remaining_time": "3:36:00", "throughput": 333.16, "total_tokens": 46331712} {"current_steps": 36595, "total_steps": 40000, "loss": 0.0462, "lr": 0.005335055382095555, "epoch": 1.7880683067451688, "percentage": 91.49, "elapsed_time": "1 day, 14:37:50", "remaining_time": "3:35:39", "throughput": 333.2, "total_tokens": 46337728} {"current_steps": 36600, "total_steps": 40000, "loss": 0.0565, "lr": 0.005319496358699915, "epoch": 1.7883126084088632, "percentage": 91.5, "elapsed_time": "1 day, 14:37:53", "remaining_time": "3:35:19", "throughput": 333.23, "total_tokens": 46343744} {"current_steps": 36600, "total_steps": 40000, "eval_loss": 0.06051120162010193, "epoch": 1.7883126084088632, "percentage": 91.5, "elapsed_time": "1 day, 14:48:28", "remaining_time": "3:36:18", "throughput": 331.72, "total_tokens": 46343744} {"current_steps": 36605, "total_steps": 40000, "loss": 0.0663, "lr": 0.005303959646856099, "epoch": 1.7885569100725576, "percentage": 91.51, "elapsed_time": "1 day, 14:48:38", "remaining_time": "3:35:58", "throughput": 331.74, "total_tokens": 46350400} {"current_steps": 36610, "total_steps": 40000, "loss": 0.0648, "lr": 0.005288445248960089, "epoch": 1.788801211736252, "percentage": 91.53, "elapsed_time": "1 day, 14:48:41", "remaining_time": "3:35:37", "throughput": 331.78, "total_tokens": 46356768} {"current_steps": 36615, "total_steps": 40000, "loss": 0.0404, "lr": 0.005272953167404354, "epoch": 1.7890455133999463, "percentage": 91.54, "elapsed_time": "1 day, 14:48:44", "remaining_time": "3:35:17", "throughput": 331.82, "total_tokens": 46363040} {"current_steps": 36620, "total_steps": 40000, "loss": 0.0674, "lr": 0.005257483404578017, "epoch": 1.7892898150636407, "percentage": 91.55, "elapsed_time": "1 day, 14:48:47", "remaining_time": "3:34:56", "throughput": 331.86, "total_tokens": 46369216} {"current_steps": 36625, "total_steps": 40000, "loss": 0.0337, "lr": 0.0052420359628666865, "epoch": 1.7895341167273349, "percentage": 91.56, "elapsed_time": "1 day, 14:48:50", "remaining_time": "3:34:36", "throughput": 331.89, "total_tokens": 46375424} {"current_steps": 36630, "total_steps": 40000, "loss": 0.0609, "lr": 0.00522661084465254, "epoch": 1.7897784183910292, "percentage": 91.57, "elapsed_time": "1 day, 14:48:53", "remaining_time": "3:34:15", "throughput": 331.93, "total_tokens": 46381888} {"current_steps": 36635, "total_steps": 40000, "loss": 0.0555, "lr": 0.005211208052314326, "epoch": 1.7900227200547236, "percentage": 91.59, "elapsed_time": "1 day, 14:48:56", "remaining_time": "3:33:55", "throughput": 331.97, "total_tokens": 46388288} {"current_steps": 36640, "total_steps": 40000, "loss": 0.0498, "lr": 0.005195827588227391, "epoch": 1.7902670217184178, "percentage": 91.6, "elapsed_time": "1 day, 14:48:59", "remaining_time": "3:33:34", "throughput": 332.01, "total_tokens": 46394752} {"current_steps": 36645, "total_steps": 40000, "loss": 0.0761, "lr": 0.0051804694547635255, "epoch": 1.7905113233821122, "percentage": 91.61, "elapsed_time": "1 day, 14:49:02", "remaining_time": "3:33:14", "throughput": 332.05, "total_tokens": 46401280} {"current_steps": 36650, "total_steps": 40000, "loss": 0.0807, "lr": 0.005165133654291232, "epoch": 1.7907556250458065, "percentage": 91.62, "elapsed_time": "1 day, 14:49:05", "remaining_time": "3:32:53", "throughput": 332.08, "total_tokens": 46407296} {"current_steps": 36655, "total_steps": 40000, "loss": 0.0384, "lr": 0.005149820189175402, "epoch": 1.790999926709501, "percentage": 91.64, "elapsed_time": "1 day, 14:49:08", "remaining_time": "3:32:32", "throughput": 332.13, "total_tokens": 46414080} {"current_steps": 36660, "total_steps": 40000, "loss": 0.075, "lr": 0.005134529061777598, "epoch": 1.7912442283731953, "percentage": 91.65, "elapsed_time": "1 day, 14:49:11", "remaining_time": "3:32:12", "throughput": 332.16, "total_tokens": 46420480} {"current_steps": 36665, "total_steps": 40000, "loss": 0.0671, "lr": 0.005119260274455933, "epoch": 1.7914885300368897, "percentage": 91.66, "elapsed_time": "1 day, 14:49:14", "remaining_time": "3:31:51", "throughput": 332.2, "total_tokens": 46426272} {"current_steps": 36670, "total_steps": 40000, "loss": 0.0522, "lr": 0.005104013829565007, "epoch": 1.7917328317005838, "percentage": 91.67, "elapsed_time": "1 day, 14:49:17", "remaining_time": "3:31:31", "throughput": 332.23, "total_tokens": 46432288} {"current_steps": 36675, "total_steps": 40000, "loss": 0.0379, "lr": 0.005088789729456006, "epoch": 1.7919771333642782, "percentage": 91.69, "elapsed_time": "1 day, 14:49:20", "remaining_time": "3:31:10", "throughput": 332.27, "total_tokens": 46438880} {"current_steps": 36680, "total_steps": 40000, "loss": 0.0688, "lr": 0.005073587976476735, "epoch": 1.7922214350279724, "percentage": 91.7, "elapsed_time": "1 day, 14:49:23", "remaining_time": "3:30:50", "throughput": 332.31, "total_tokens": 46445152} {"current_steps": 36685, "total_steps": 40000, "loss": 0.0609, "lr": 0.005058408572971418, "epoch": 1.7924657366916668, "percentage": 91.71, "elapsed_time": "1 day, 14:49:26", "remaining_time": "3:30:29", "throughput": 332.34, "total_tokens": 46450816} {"current_steps": 36690, "total_steps": 40000, "loss": 0.0401, "lr": 0.005043251521280983, "epoch": 1.7927100383553611, "percentage": 91.72, "elapsed_time": "1 day, 14:49:29", "remaining_time": "3:30:09", "throughput": 332.38, "total_tokens": 46457408} {"current_steps": 36695, "total_steps": 40000, "loss": 0.0578, "lr": 0.005028116823742795, "epoch": 1.7929543400190555, "percentage": 91.74, "elapsed_time": "1 day, 14:49:33", "remaining_time": "3:29:48", "throughput": 332.42, "total_tokens": 46463968} {"current_steps": 36700, "total_steps": 40000, "loss": 0.0664, "lr": 0.005013004482690819, "epoch": 1.79319864168275, "percentage": 91.75, "elapsed_time": "1 day, 14:49:36", "remaining_time": "3:29:28", "throughput": 332.46, "total_tokens": 46470432} {"current_steps": 36705, "total_steps": 40000, "loss": 0.0486, "lr": 0.0049979145004555746, "epoch": 1.7934429433464443, "percentage": 91.76, "elapsed_time": "1 day, 14:49:39", "remaining_time": "3:29:07", "throughput": 332.5, "total_tokens": 46476992} {"current_steps": 36710, "total_steps": 40000, "loss": 0.0587, "lr": 0.004982846879364116, "epoch": 1.7936872450101387, "percentage": 91.77, "elapsed_time": "1 day, 14:49:42", "remaining_time": "3:28:47", "throughput": 332.54, "total_tokens": 46483520} {"current_steps": 36715, "total_steps": 40000, "loss": 0.0383, "lr": 0.0049678016217400535, "epoch": 1.7939315466738328, "percentage": 91.79, "elapsed_time": "1 day, 14:49:45", "remaining_time": "3:28:27", "throughput": 332.58, "total_tokens": 46489568} {"current_steps": 36720, "total_steps": 40000, "loss": 0.0697, "lr": 0.004952778729903595, "epoch": 1.7941758483375272, "percentage": 91.8, "elapsed_time": "1 day, 14:49:48", "remaining_time": "3:28:06", "throughput": 332.62, "total_tokens": 46495808} {"current_steps": 36725, "total_steps": 40000, "loss": 0.0429, "lr": 0.004937778206171422, "epoch": 1.7944201500012213, "percentage": 91.81, "elapsed_time": "1 day, 14:49:51", "remaining_time": "3:27:46", "throughput": 332.65, "total_tokens": 46501920} {"current_steps": 36730, "total_steps": 40000, "loss": 0.0565, "lr": 0.004922800052856835, "epoch": 1.7946644516649157, "percentage": 91.83, "elapsed_time": "1 day, 14:49:54", "remaining_time": "3:27:25", "throughput": 332.69, "total_tokens": 46508224} {"current_steps": 36735, "total_steps": 40000, "loss": 0.0783, "lr": 0.004907844272269602, "epoch": 1.79490875332861, "percentage": 91.84, "elapsed_time": "1 day, 14:49:57", "remaining_time": "3:27:05", "throughput": 332.73, "total_tokens": 46514560} {"current_steps": 36740, "total_steps": 40000, "loss": 0.0715, "lr": 0.004892910866716144, "epoch": 1.7951530549923045, "percentage": 91.85, "elapsed_time": "1 day, 14:50:00", "remaining_time": "3:26:44", "throughput": 332.76, "total_tokens": 46520352} {"current_steps": 36745, "total_steps": 40000, "loss": 0.043, "lr": 0.004877999838499369, "epoch": 1.7953973566559989, "percentage": 91.86, "elapsed_time": "1 day, 14:50:03", "remaining_time": "3:26:24", "throughput": 332.8, "total_tokens": 46527360} {"current_steps": 36750, "total_steps": 40000, "loss": 0.0354, "lr": 0.0048631111899187065, "epoch": 1.7956416583196932, "percentage": 91.88, "elapsed_time": "1 day, 14:50:06", "remaining_time": "3:26:03", "throughput": 332.84, "total_tokens": 46533632} {"current_steps": 36755, "total_steps": 40000, "loss": 0.0562, "lr": 0.0048482449232702335, "epoch": 1.7958859599833876, "percentage": 91.89, "elapsed_time": "1 day, 14:50:10", "remaining_time": "3:25:43", "throughput": 332.88, "total_tokens": 46540160} {"current_steps": 36760, "total_steps": 40000, "loss": 0.0737, "lr": 0.004833401040846469, "epoch": 1.7961302616470818, "percentage": 91.9, "elapsed_time": "1 day, 14:50:13", "remaining_time": "3:25:23", "throughput": 332.92, "total_tokens": 46546848} {"current_steps": 36765, "total_steps": 40000, "loss": 0.0606, "lr": 0.004818579544936546, "epoch": 1.7963745633107762, "percentage": 91.91, "elapsed_time": "1 day, 14:50:16", "remaining_time": "3:25:02", "throughput": 332.96, "total_tokens": 46553280} {"current_steps": 36770, "total_steps": 40000, "loss": 0.0464, "lr": 0.004803780437826121, "epoch": 1.7966188649744703, "percentage": 91.92, "elapsed_time": "1 day, 14:50:19", "remaining_time": "3:24:42", "throughput": 333.0, "total_tokens": 46559424} {"current_steps": 36775, "total_steps": 40000, "loss": 0.0368, "lr": 0.004789003721797402, "epoch": 1.7968631666381647, "percentage": 91.94, "elapsed_time": "1 day, 14:50:22", "remaining_time": "3:24:21", "throughput": 333.03, "total_tokens": 46565568} {"current_steps": 36780, "total_steps": 40000, "loss": 0.0422, "lr": 0.004774249399129132, "epoch": 1.797107468301859, "percentage": 91.95, "elapsed_time": "1 day, 14:50:25", "remaining_time": "3:24:01", "throughput": 333.07, "total_tokens": 46571840} {"current_steps": 36785, "total_steps": 40000, "loss": 0.0472, "lr": 0.004759517472096642, "epoch": 1.7973517699655535, "percentage": 91.96, "elapsed_time": "1 day, 14:50:28", "remaining_time": "3:23:40", "throughput": 333.11, "total_tokens": 46578560} {"current_steps": 36790, "total_steps": 40000, "loss": 0.0402, "lr": 0.004744807942971746, "epoch": 1.7975960716292478, "percentage": 91.97, "elapsed_time": "1 day, 14:50:31", "remaining_time": "3:23:20", "throughput": 333.15, "total_tokens": 46584864} {"current_steps": 36795, "total_steps": 40000, "loss": 0.0368, "lr": 0.004730120814022881, "epoch": 1.7978403732929422, "percentage": 91.99, "elapsed_time": "1 day, 14:50:34", "remaining_time": "3:23:00", "throughput": 333.19, "total_tokens": 46591072} {"current_steps": 36800, "total_steps": 40000, "loss": 0.0677, "lr": 0.004715456087514935, "epoch": 1.7980846749566366, "percentage": 92.0, "elapsed_time": "1 day, 14:50:37", "remaining_time": "3:22:39", "throughput": 333.23, "total_tokens": 46597920} {"current_steps": 36800, "total_steps": 40000, "eval_loss": 0.06061924993991852, "epoch": 1.7980846749566366, "percentage": 92.0, "elapsed_time": "1 day, 15:01:11", "remaining_time": "3:23:34", "throughput": 331.73, "total_tokens": 46597920} {"current_steps": 36805, "total_steps": 40000, "loss": 0.0681, "lr": 0.004700813765709432, "epoch": 1.7983289766203308, "percentage": 92.01, "elapsed_time": "1 day, 15:01:15", "remaining_time": "3:23:14", "throughput": 331.76, "total_tokens": 46604416} {"current_steps": 36810, "total_steps": 40000, "loss": 0.0468, "lr": 0.004686193850864401, "epoch": 1.7985732782840251, "percentage": 92.03, "elapsed_time": "1 day, 15:01:18", "remaining_time": "3:22:54", "throughput": 331.8, "total_tokens": 46611072} {"current_steps": 36815, "total_steps": 40000, "loss": 0.0835, "lr": 0.004671596345234385, "epoch": 1.7988175799477193, "percentage": 92.04, "elapsed_time": "1 day, 15:01:21", "remaining_time": "3:22:33", "throughput": 331.84, "total_tokens": 46617536} {"current_steps": 36820, "total_steps": 40000, "loss": 0.071, "lr": 0.00465702125107052, "epoch": 1.7990618816114137, "percentage": 92.05, "elapsed_time": "1 day, 15:01:24", "remaining_time": "3:22:13", "throughput": 331.88, "total_tokens": 46624320} {"current_steps": 36825, "total_steps": 40000, "loss": 0.0323, "lr": 0.004642468570620506, "epoch": 1.799306183275108, "percentage": 92.06, "elapsed_time": "1 day, 15:01:27", "remaining_time": "3:21:52", "throughput": 331.92, "total_tokens": 46630624} {"current_steps": 36830, "total_steps": 40000, "loss": 0.0595, "lr": 0.004627938306128482, "epoch": 1.7995504849388024, "percentage": 92.07, "elapsed_time": "1 day, 15:01:30", "remaining_time": "3:21:32", "throughput": 331.96, "total_tokens": 46637024} {"current_steps": 36835, "total_steps": 40000, "loss": 0.0307, "lr": 0.004613430459835255, "epoch": 1.7997947866024968, "percentage": 92.09, "elapsed_time": "1 day, 15:01:33", "remaining_time": "3:21:11", "throughput": 332.0, "total_tokens": 46643712} {"current_steps": 36840, "total_steps": 40000, "loss": 0.066, "lr": 0.004598945033978085, "epoch": 1.8000390882661912, "percentage": 92.1, "elapsed_time": "1 day, 15:01:36", "remaining_time": "3:20:51", "throughput": 332.03, "total_tokens": 46649696} {"current_steps": 36845, "total_steps": 40000, "loss": 0.042, "lr": 0.004584482030790804, "epoch": 1.8002833899298856, "percentage": 92.11, "elapsed_time": "1 day, 15:01:40", "remaining_time": "3:20:30", "throughput": 332.07, "total_tokens": 46656352} {"current_steps": 36850, "total_steps": 40000, "loss": 0.0513, "lr": 0.004570041452503826, "epoch": 1.8005276915935797, "percentage": 92.12, "elapsed_time": "1 day, 15:01:43", "remaining_time": "3:20:10", "throughput": 332.11, "total_tokens": 46663008} {"current_steps": 36855, "total_steps": 40000, "loss": 0.0615, "lr": 0.004555623301344003, "epoch": 1.800771993257274, "percentage": 92.14, "elapsed_time": "1 day, 15:01:46", "remaining_time": "3:19:50", "throughput": 332.15, "total_tokens": 46669440} {"current_steps": 36860, "total_steps": 40000, "loss": 0.0653, "lr": 0.004541227579534857, "epoch": 1.8010162949209683, "percentage": 92.15, "elapsed_time": "1 day, 15:01:49", "remaining_time": "3:19:29", "throughput": 332.19, "total_tokens": 46675776} {"current_steps": 36865, "total_steps": 40000, "loss": 0.0319, "lr": 0.004526854289296378, "epoch": 1.8012605965846626, "percentage": 92.16, "elapsed_time": "1 day, 15:01:52", "remaining_time": "3:19:09", "throughput": 332.23, "total_tokens": 46682080} {"current_steps": 36870, "total_steps": 40000, "loss": 0.0694, "lr": 0.004512503432845078, "epoch": 1.801504898248357, "percentage": 92.17, "elapsed_time": "1 day, 15:01:55", "remaining_time": "3:18:48", "throughput": 332.27, "total_tokens": 46688512} {"current_steps": 36875, "total_steps": 40000, "loss": 0.0504, "lr": 0.004498175012394068, "epoch": 1.8017491999120514, "percentage": 92.19, "elapsed_time": "1 day, 15:01:58", "remaining_time": "3:18:28", "throughput": 332.31, "total_tokens": 46695296} {"current_steps": 36880, "total_steps": 40000, "loss": 0.0772, "lr": 0.004483869030152965, "epoch": 1.8019935015757458, "percentage": 92.2, "elapsed_time": "1 day, 15:02:01", "remaining_time": "3:18:07", "throughput": 332.34, "total_tokens": 46701376} {"current_steps": 36885, "total_steps": 40000, "loss": 0.0532, "lr": 0.004469585488327904, "epoch": 1.8022378032394402, "percentage": 92.21, "elapsed_time": "1 day, 15:02:04", "remaining_time": "3:17:47", "throughput": 332.38, "total_tokens": 46707936} {"current_steps": 36890, "total_steps": 40000, "loss": 0.0555, "lr": 0.0044553243891216395, "epoch": 1.8024821049031345, "percentage": 92.22, "elapsed_time": "1 day, 15:02:07", "remaining_time": "3:17:27", "throughput": 332.42, "total_tokens": 46714016} {"current_steps": 36895, "total_steps": 40000, "loss": 0.0526, "lr": 0.004441085734733363, "epoch": 1.8027264065668287, "percentage": 92.24, "elapsed_time": "1 day, 15:02:10", "remaining_time": "3:17:06", "throughput": 332.46, "total_tokens": 46720544} {"current_steps": 36900, "total_steps": 40000, "loss": 0.0683, "lr": 0.004426869527358884, "epoch": 1.802970708230523, "percentage": 92.25, "elapsed_time": "1 day, 15:02:14", "remaining_time": "3:16:46", "throughput": 332.5, "total_tokens": 46727040} {"current_steps": 36905, "total_steps": 40000, "loss": 0.0659, "lr": 0.0044126757691905156, "epoch": 1.8032150098942172, "percentage": 92.26, "elapsed_time": "1 day, 15:02:17", "remaining_time": "3:16:25", "throughput": 332.53, "total_tokens": 46733280} {"current_steps": 36910, "total_steps": 40000, "loss": 0.04, "lr": 0.004398504462417107, "epoch": 1.8034593115579116, "percentage": 92.27, "elapsed_time": "1 day, 15:02:20", "remaining_time": "3:16:05", "throughput": 332.57, "total_tokens": 46739488} {"current_steps": 36915, "total_steps": 40000, "loss": 0.0505, "lr": 0.0043843556092240605, "epoch": 1.803703613221606, "percentage": 92.29, "elapsed_time": "1 day, 15:02:23", "remaining_time": "3:15:45", "throughput": 332.61, "total_tokens": 46745536} {"current_steps": 36920, "total_steps": 40000, "loss": 0.0509, "lr": 0.004370229211793281, "epoch": 1.8039479148853004, "percentage": 92.3, "elapsed_time": "1 day, 15:02:26", "remaining_time": "3:15:24", "throughput": 332.64, "total_tokens": 46751712} {"current_steps": 36925, "total_steps": 40000, "loss": 0.0585, "lr": 0.0043561252723032405, "epoch": 1.8041922165489948, "percentage": 92.31, "elapsed_time": "1 day, 15:02:29", "remaining_time": "3:15:04", "throughput": 332.68, "total_tokens": 46757568} {"current_steps": 36930, "total_steps": 40000, "loss": 0.069, "lr": 0.004342043792929001, "epoch": 1.8044365182126891, "percentage": 92.33, "elapsed_time": "1 day, 15:02:32", "remaining_time": "3:14:44", "throughput": 332.71, "total_tokens": 46763552} {"current_steps": 36935, "total_steps": 40000, "loss": 0.064, "lr": 0.004327984775842025, "epoch": 1.8046808198763835, "percentage": 92.34, "elapsed_time": "1 day, 15:02:35", "remaining_time": "3:14:23", "throughput": 332.75, "total_tokens": 46769504} {"current_steps": 36940, "total_steps": 40000, "loss": 0.0489, "lr": 0.004313948223210428, "epoch": 1.8049251215400777, "percentage": 92.35, "elapsed_time": "1 day, 15:02:38", "remaining_time": "3:14:03", "throughput": 332.79, "total_tokens": 46775744} {"current_steps": 36945, "total_steps": 40000, "loss": 0.0659, "lr": 0.004299934137198846, "epoch": 1.805169423203772, "percentage": 92.36, "elapsed_time": "1 day, 15:02:41", "remaining_time": "3:13:43", "throughput": 332.82, "total_tokens": 46781664} {"current_steps": 36950, "total_steps": 40000, "loss": 0.0525, "lr": 0.004285942519968383, "epoch": 1.8054137248674662, "percentage": 92.38, "elapsed_time": "1 day, 15:02:44", "remaining_time": "3:13:22", "throughput": 332.86, "total_tokens": 46788160} {"current_steps": 36955, "total_steps": 40000, "loss": 0.0726, "lr": 0.004271973373676746, "epoch": 1.8056580265311606, "percentage": 92.39, "elapsed_time": "1 day, 15:02:47", "remaining_time": "3:13:02", "throughput": 332.9, "total_tokens": 46794304} {"current_steps": 36960, "total_steps": 40000, "loss": 0.0745, "lr": 0.004258026700478146, "epoch": 1.805902328194855, "percentage": 92.4, "elapsed_time": "1 day, 15:02:50", "remaining_time": "3:12:42", "throughput": 332.93, "total_tokens": 46800352} {"current_steps": 36965, "total_steps": 40000, "loss": 0.0678, "lr": 0.004244102502523328, "epoch": 1.8061466298585493, "percentage": 92.41, "elapsed_time": "1 day, 15:02:53", "remaining_time": "3:12:21", "throughput": 332.97, "total_tokens": 46806496} {"current_steps": 36970, "total_steps": 40000, "loss": 0.0824, "lr": 0.004230200781959592, "epoch": 1.8063909315222437, "percentage": 92.42, "elapsed_time": "1 day, 15:02:56", "remaining_time": "3:12:01", "throughput": 333.0, "total_tokens": 46812256} {"current_steps": 36975, "total_steps": 40000, "loss": 0.0537, "lr": 0.004216321540930756, "epoch": 1.806635233185938, "percentage": 92.44, "elapsed_time": "1 day, 15:02:59", "remaining_time": "3:11:41", "throughput": 333.04, "total_tokens": 46818688} {"current_steps": 36980, "total_steps": 40000, "loss": 0.059, "lr": 0.004202464781577175, "epoch": 1.8068795348496325, "percentage": 92.45, "elapsed_time": "1 day, 15:03:02", "remaining_time": "3:11:20", "throughput": 333.08, "total_tokens": 46825184} {"current_steps": 36985, "total_steps": 40000, "loss": 0.0687, "lr": 0.00418863050603574, "epoch": 1.8071238365133266, "percentage": 92.46, "elapsed_time": "1 day, 15:03:05", "remaining_time": "3:11:00", "throughput": 333.11, "total_tokens": 46831104} {"current_steps": 36990, "total_steps": 40000, "loss": 0.0609, "lr": 0.004174818716439843, "epoch": 1.807368138177021, "percentage": 92.47, "elapsed_time": "1 day, 15:03:08", "remaining_time": "3:10:40", "throughput": 333.15, "total_tokens": 46837440} {"current_steps": 36995, "total_steps": 40000, "loss": 0.0778, "lr": 0.004161029414919464, "epoch": 1.8076124398407152, "percentage": 92.49, "elapsed_time": "1 day, 15:03:11", "remaining_time": "3:10:19", "throughput": 333.19, "total_tokens": 46844224} {"current_steps": 37000, "total_steps": 40000, "loss": 0.0486, "lr": 0.004147262603601071, "epoch": 1.8078567415044096, "percentage": 92.5, "elapsed_time": "1 day, 15:03:14", "remaining_time": "3:09:59", "throughput": 333.23, "total_tokens": 46850336} {"current_steps": 37000, "total_steps": 40000, "eval_loss": 0.06101835519075394, "epoch": 1.8078567415044096, "percentage": 92.5, "elapsed_time": "1 day, 15:13:48", "remaining_time": "3:10:50", "throughput": 331.73, "total_tokens": 46850336} {"current_steps": 37005, "total_steps": 40000, "loss": 0.0615, "lr": 0.004133518284607679, "epoch": 1.808101043168104, "percentage": 92.51, "elapsed_time": "1 day, 15:13:52", "remaining_time": "3:10:30", "throughput": 331.77, "total_tokens": 46856768} {"current_steps": 37010, "total_steps": 40000, "loss": 0.0539, "lr": 0.004119796460058861, "epoch": 1.8083453448317983, "percentage": 92.53, "elapsed_time": "1 day, 15:13:55", "remaining_time": "3:10:10", "throughput": 331.81, "total_tokens": 46862944} {"current_steps": 37015, "total_steps": 40000, "loss": 0.0437, "lr": 0.00410609713207064, "epoch": 1.8085896464954927, "percentage": 92.54, "elapsed_time": "1 day, 15:13:58", "remaining_time": "3:09:49", "throughput": 331.84, "total_tokens": 46869344} {"current_steps": 37020, "total_steps": 40000, "loss": 0.0381, "lr": 0.004092420302755678, "epoch": 1.808833948159187, "percentage": 92.55, "elapsed_time": "1 day, 15:14:01", "remaining_time": "3:09:29", "throughput": 331.89, "total_tokens": 46876320} {"current_steps": 37025, "total_steps": 40000, "loss": 0.0335, "lr": 0.004078765974223103, "epoch": 1.8090782498228815, "percentage": 92.56, "elapsed_time": "1 day, 15:14:04", "remaining_time": "3:09:09", "throughput": 331.92, "total_tokens": 46881984} {"current_steps": 37030, "total_steps": 40000, "loss": 0.0791, "lr": 0.004065134148578564, "epoch": 1.8093225514865756, "percentage": 92.58, "elapsed_time": "1 day, 15:14:07", "remaining_time": "3:08:48", "throughput": 331.95, "total_tokens": 46887904} {"current_steps": 37035, "total_steps": 40000, "loss": 0.0462, "lr": 0.004051524827924279, "epoch": 1.80956685315027, "percentage": 92.59, "elapsed_time": "1 day, 15:14:10", "remaining_time": "3:08:28", "throughput": 331.99, "total_tokens": 46894400} {"current_steps": 37040, "total_steps": 40000, "loss": 0.0805, "lr": 0.004037938014358955, "epoch": 1.8098111548139642, "percentage": 92.6, "elapsed_time": "1 day, 15:14:14", "remaining_time": "3:08:08", "throughput": 332.03, "total_tokens": 46900480} {"current_steps": 37045, "total_steps": 40000, "loss": 0.0683, "lr": 0.004024373709977863, "epoch": 1.8100554564776585, "percentage": 92.61, "elapsed_time": "1 day, 15:14:17", "remaining_time": "3:07:47", "throughput": 332.07, "total_tokens": 46907200} {"current_steps": 37050, "total_steps": 40000, "loss": 0.0523, "lr": 0.004010831916872814, "epoch": 1.810299758141353, "percentage": 92.62, "elapsed_time": "1 day, 15:14:20", "remaining_time": "3:07:27", "throughput": 332.11, "total_tokens": 46913952} {"current_steps": 37055, "total_steps": 40000, "loss": 0.0592, "lr": 0.003997312637132089, "epoch": 1.8105440598050473, "percentage": 92.64, "elapsed_time": "1 day, 15:14:23", "remaining_time": "3:07:07", "throughput": 332.15, "total_tokens": 46920416} {"current_steps": 37060, "total_steps": 40000, "loss": 0.0552, "lr": 0.003983815872840535, "epoch": 1.8107883614687417, "percentage": 92.65, "elapsed_time": "1 day, 15:14:26", "remaining_time": "3:06:46", "throughput": 332.18, "total_tokens": 46926432} {"current_steps": 37065, "total_steps": 40000, "loss": 0.053, "lr": 0.003970341626079521, "epoch": 1.811032663132436, "percentage": 92.66, "elapsed_time": "1 day, 15:14:29", "remaining_time": "3:06:26", "throughput": 332.22, "total_tokens": 46932768} {"current_steps": 37070, "total_steps": 40000, "loss": 0.0749, "lr": 0.003956889898926952, "epoch": 1.8112769647961302, "percentage": 92.67, "elapsed_time": "1 day, 15:14:32", "remaining_time": "3:06:06", "throughput": 332.26, "total_tokens": 46938848} {"current_steps": 37075, "total_steps": 40000, "loss": 0.0595, "lr": 0.0039434606934572675, "epoch": 1.8115212664598246, "percentage": 92.69, "elapsed_time": "1 day, 15:14:35", "remaining_time": "3:05:45", "throughput": 332.3, "total_tokens": 46945440} {"current_steps": 37080, "total_steps": 40000, "loss": 0.051, "lr": 0.003930054011741396, "epoch": 1.811765568123519, "percentage": 92.7, "elapsed_time": "1 day, 15:14:38", "remaining_time": "3:05:25", "throughput": 332.33, "total_tokens": 46951808} {"current_steps": 37085, "total_steps": 40000, "loss": 0.0451, "lr": 0.0039166698558468155, "epoch": 1.8120098697872131, "percentage": 92.71, "elapsed_time": "1 day, 15:14:41", "remaining_time": "3:05:05", "throughput": 332.37, "total_tokens": 46958400} {"current_steps": 37090, "total_steps": 40000, "loss": 0.0498, "lr": 0.0039033082278375594, "epoch": 1.8122541714509075, "percentage": 92.73, "elapsed_time": "1 day, 15:14:44", "remaining_time": "3:04:44", "throughput": 332.41, "total_tokens": 46965056} {"current_steps": 37095, "total_steps": 40000, "loss": 0.0384, "lr": 0.003889969129774112, "epoch": 1.8124984731146019, "percentage": 92.74, "elapsed_time": "1 day, 15:14:47", "remaining_time": "3:04:24", "throughput": 332.45, "total_tokens": 46971040} {"current_steps": 37100, "total_steps": 40000, "loss": 0.0492, "lr": 0.0038766525637135784, "epoch": 1.8127427747782963, "percentage": 92.75, "elapsed_time": "1 day, 15:14:51", "remaining_time": "3:04:04", "throughput": 332.49, "total_tokens": 46977344} {"current_steps": 37105, "total_steps": 40000, "loss": 0.0457, "lr": 0.0038633585317095318, "epoch": 1.8129870764419906, "percentage": 92.76, "elapsed_time": "1 day, 15:14:54", "remaining_time": "3:03:44", "throughput": 332.53, "total_tokens": 46983872} {"current_steps": 37110, "total_steps": 40000, "loss": 0.0468, "lr": 0.00385008703581205, "epoch": 1.813231378105685, "percentage": 92.77, "elapsed_time": "1 day, 15:14:57", "remaining_time": "3:03:23", "throughput": 332.56, "total_tokens": 46990080} {"current_steps": 37115, "total_steps": 40000, "loss": 0.0725, "lr": 0.0038368380780677944, "epoch": 1.8134756797693792, "percentage": 92.79, "elapsed_time": "1 day, 15:15:00", "remaining_time": "3:03:03", "throughput": 332.6, "total_tokens": 46996224} {"current_steps": 37120, "total_steps": 40000, "loss": 0.0439, "lr": 0.003823611660519882, "epoch": 1.8137199814330736, "percentage": 92.8, "elapsed_time": "1 day, 15:15:03", "remaining_time": "3:02:43", "throughput": 332.64, "total_tokens": 47002496} {"current_steps": 37125, "total_steps": 40000, "loss": 0.0505, "lr": 0.0038104077852080475, "epoch": 1.813964283096768, "percentage": 92.81, "elapsed_time": "1 day, 15:15:06", "remaining_time": "3:02:22", "throughput": 332.67, "total_tokens": 47008640} {"current_steps": 37130, "total_steps": 40000, "loss": 0.05, "lr": 0.003797226454168462, "epoch": 1.814208584760462, "percentage": 92.83, "elapsed_time": "1 day, 15:15:09", "remaining_time": "3:02:02", "throughput": 332.71, "total_tokens": 47015200} {"current_steps": 37135, "total_steps": 40000, "loss": 0.0333, "lr": 0.003784067669433849, "epoch": 1.8144528864241565, "percentage": 92.84, "elapsed_time": "1 day, 15:15:12", "remaining_time": "3:01:42", "throughput": 332.75, "total_tokens": 47021664} {"current_steps": 37140, "total_steps": 40000, "loss": 0.0574, "lr": 0.0037709314330334528, "epoch": 1.8146971880878509, "percentage": 92.85, "elapsed_time": "1 day, 15:15:15", "remaining_time": "3:01:22", "throughput": 332.79, "total_tokens": 47027808} {"current_steps": 37145, "total_steps": 40000, "loss": 0.0628, "lr": 0.003757817746993086, "epoch": 1.8149414897515452, "percentage": 92.86, "elapsed_time": "1 day, 15:15:18", "remaining_time": "3:01:01", "throughput": 332.82, "total_tokens": 47034272} {"current_steps": 37150, "total_steps": 40000, "loss": 0.0685, "lr": 0.0037447266133349977, "epoch": 1.8151857914152396, "percentage": 92.88, "elapsed_time": "1 day, 15:15:21", "remaining_time": "3:00:41", "throughput": 332.86, "total_tokens": 47040224} {"current_steps": 37155, "total_steps": 40000, "loss": 0.0711, "lr": 0.003731658034078039, "epoch": 1.815430093078934, "percentage": 92.89, "elapsed_time": "1 day, 15:15:24", "remaining_time": "3:00:21", "throughput": 332.9, "total_tokens": 47046816} {"current_steps": 37160, "total_steps": 40000, "loss": 0.0624, "lr": 0.0037186120112375153, "epoch": 1.8156743947426282, "percentage": 92.9, "elapsed_time": "1 day, 15:15:27", "remaining_time": "3:00:01", "throughput": 332.94, "total_tokens": 47053312} {"current_steps": 37165, "total_steps": 40000, "loss": 0.0358, "lr": 0.003705588546825317, "epoch": 1.8159186964063225, "percentage": 92.91, "elapsed_time": "1 day, 15:15:30", "remaining_time": "2:59:40", "throughput": 332.98, "total_tokens": 47059904} {"current_steps": 37170, "total_steps": 40000, "loss": 0.0487, "lr": 0.0036925876428498205, "epoch": 1.816162998070017, "percentage": 92.92, "elapsed_time": "1 day, 15:15:34", "remaining_time": "2:59:20", "throughput": 333.01, "total_tokens": 47066240} {"current_steps": 37175, "total_steps": 40000, "loss": 0.0601, "lr": 0.0036796093013159057, "epoch": 1.816407299733711, "percentage": 92.94, "elapsed_time": "1 day, 15:15:37", "remaining_time": "2:59:00", "throughput": 333.05, "total_tokens": 47072128} {"current_steps": 37180, "total_steps": 40000, "loss": 0.0707, "lr": 0.0036666535242250217, "epoch": 1.8166516013974054, "percentage": 92.95, "elapsed_time": "1 day, 15:15:40", "remaining_time": "2:58:40", "throughput": 333.09, "total_tokens": 47078464} {"current_steps": 37185, "total_steps": 40000, "loss": 0.0702, "lr": 0.003653720313575104, "epoch": 1.8168959030610998, "percentage": 92.96, "elapsed_time": "1 day, 15:15:43", "remaining_time": "2:58:20", "throughput": 333.13, "total_tokens": 47084960} {"current_steps": 37190, "total_steps": 40000, "loss": 0.073, "lr": 0.003640809671360623, "epoch": 1.8171402047247942, "percentage": 92.97, "elapsed_time": "1 day, 15:15:46", "remaining_time": "2:57:59", "throughput": 333.16, "total_tokens": 47091392} {"current_steps": 37195, "total_steps": 40000, "loss": 0.0619, "lr": 0.003627921599572553, "epoch": 1.8173845063884886, "percentage": 92.99, "elapsed_time": "1 day, 15:15:49", "remaining_time": "2:57:39", "throughput": 333.21, "total_tokens": 47098720} {"current_steps": 37200, "total_steps": 40000, "loss": 0.0443, "lr": 0.003615056100198405, "epoch": 1.817628808052183, "percentage": 93.0, "elapsed_time": "1 day, 15:15:52", "remaining_time": "2:57:19", "throughput": 333.24, "total_tokens": 47104992} {"current_steps": 37200, "total_steps": 40000, "eval_loss": 0.06071794405579567, "epoch": 1.817628808052183, "percentage": 93.0, "elapsed_time": "1 day, 15:26:26", "remaining_time": "2:58:07", "throughput": 331.76, "total_tokens": 47104992} {"current_steps": 37205, "total_steps": 40000, "loss": 0.0353, "lr": 0.003602213175222174, "epoch": 1.8178731097158771, "percentage": 93.01, "elapsed_time": "1 day, 15:26:30", "remaining_time": "2:57:46", "throughput": 331.79, "total_tokens": 47111456} {"current_steps": 37210, "total_steps": 40000, "loss": 0.0826, "lr": 0.0035893928266244432, "epoch": 1.8181174113795715, "percentage": 93.03, "elapsed_time": "1 day, 15:26:33", "remaining_time": "2:57:26", "throughput": 331.83, "total_tokens": 47117760} {"current_steps": 37215, "total_steps": 40000, "loss": 0.0739, "lr": 0.003576595056382248, "epoch": 1.8183617130432657, "percentage": 93.04, "elapsed_time": "1 day, 15:26:36", "remaining_time": "2:57:06", "throughput": 331.87, "total_tokens": 47123648} {"current_steps": 37220, "total_steps": 40000, "loss": 0.0297, "lr": 0.0035638198664691423, "epoch": 1.81860601470696, "percentage": 93.05, "elapsed_time": "1 day, 15:26:39", "remaining_time": "2:56:46", "throughput": 331.91, "total_tokens": 47130784} {"current_steps": 37225, "total_steps": 40000, "loss": 0.0622, "lr": 0.003551067258855267, "epoch": 1.8188503163706544, "percentage": 93.06, "elapsed_time": "1 day, 15:26:42", "remaining_time": "2:56:25", "throughput": 331.95, "total_tokens": 47137056} {"current_steps": 37230, "total_steps": 40000, "loss": 0.0911, "lr": 0.0035383372355071996, "epoch": 1.8190946180343488, "percentage": 93.08, "elapsed_time": "1 day, 15:26:45", "remaining_time": "2:56:05", "throughput": 331.98, "total_tokens": 47143488} {"current_steps": 37235, "total_steps": 40000, "loss": 0.0555, "lr": 0.0035256297983881023, "epoch": 1.8193389196980432, "percentage": 93.09, "elapsed_time": "1 day, 15:26:48", "remaining_time": "2:55:45", "throughput": 332.02, "total_tokens": 47149536} {"current_steps": 37240, "total_steps": 40000, "loss": 0.067, "lr": 0.0035129449494575747, "epoch": 1.8195832213617376, "percentage": 93.1, "elapsed_time": "1 day, 15:26:51", "remaining_time": "2:55:25", "throughput": 332.06, "total_tokens": 47155872} {"current_steps": 37245, "total_steps": 40000, "loss": 0.0756, "lr": 0.0035002826906718187, "epoch": 1.819827523025432, "percentage": 93.11, "elapsed_time": "1 day, 15:26:54", "remaining_time": "2:55:04", "throughput": 332.09, "total_tokens": 47161856} {"current_steps": 37250, "total_steps": 40000, "loss": 0.0727, "lr": 0.003487643023983522, "epoch": 1.820071824689126, "percentage": 93.12, "elapsed_time": "1 day, 15:26:57", "remaining_time": "2:54:44", "throughput": 332.13, "total_tokens": 47168096} {"current_steps": 37255, "total_steps": 40000, "loss": 0.0597, "lr": 0.003475025951341842, "epoch": 1.8203161263528205, "percentage": 93.14, "elapsed_time": "1 day, 15:27:00", "remaining_time": "2:54:24", "throughput": 332.17, "total_tokens": 47174432} {"current_steps": 37260, "total_steps": 40000, "loss": 0.0423, "lr": 0.00346243147469249, "epoch": 1.8205604280165146, "percentage": 93.15, "elapsed_time": "1 day, 15:27:03", "remaining_time": "2:54:04", "throughput": 332.2, "total_tokens": 47180736} {"current_steps": 37265, "total_steps": 40000, "loss": 0.0789, "lr": 0.0034498595959777446, "epoch": 1.820804729680209, "percentage": 93.16, "elapsed_time": "1 day, 15:27:06", "remaining_time": "2:53:43", "throughput": 332.24, "total_tokens": 47187040} {"current_steps": 37270, "total_steps": 40000, "loss": 0.0621, "lr": 0.003437310317136305, "epoch": 1.8210490313439034, "percentage": 93.17, "elapsed_time": "1 day, 15:27:09", "remaining_time": "2:53:23", "throughput": 332.28, "total_tokens": 47193184} {"current_steps": 37275, "total_steps": 40000, "loss": 0.0739, "lr": 0.0034247836401034236, "epoch": 1.8212933330075978, "percentage": 93.19, "elapsed_time": "1 day, 15:27:12", "remaining_time": "2:53:03", "throughput": 332.31, "total_tokens": 47199232} {"current_steps": 37280, "total_steps": 40000, "loss": 0.0559, "lr": 0.003412279566810905, "epoch": 1.8215376346712921, "percentage": 93.2, "elapsed_time": "1 day, 15:27:16", "remaining_time": "2:52:43", "throughput": 332.35, "total_tokens": 47205632} {"current_steps": 37285, "total_steps": 40000, "loss": 0.0571, "lr": 0.00339979809918699, "epoch": 1.8217819363349865, "percentage": 93.21, "elapsed_time": "1 day, 15:27:19", "remaining_time": "2:52:22", "throughput": 332.39, "total_tokens": 47212160} {"current_steps": 37290, "total_steps": 40000, "loss": 0.0353, "lr": 0.0033873392391565228, "epoch": 1.822026237998681, "percentage": 93.23, "elapsed_time": "1 day, 15:27:22", "remaining_time": "2:52:02", "throughput": 332.42, "total_tokens": 47218144} {"current_steps": 37295, "total_steps": 40000, "loss": 0.0487, "lr": 0.003374902988640782, "epoch": 1.822270539662375, "percentage": 93.24, "elapsed_time": "1 day, 15:27:25", "remaining_time": "2:51:42", "throughput": 332.46, "total_tokens": 47224768} {"current_steps": 37300, "total_steps": 40000, "loss": 0.0557, "lr": 0.0033624893495576014, "epoch": 1.8225148413260694, "percentage": 93.25, "elapsed_time": "1 day, 15:27:28", "remaining_time": "2:51:22", "throughput": 332.5, "total_tokens": 47230912} {"current_steps": 37305, "total_steps": 40000, "loss": 0.0679, "lr": 0.0033500983238213323, "epoch": 1.8227591429897636, "percentage": 93.26, "elapsed_time": "1 day, 15:27:31", "remaining_time": "2:51:02", "throughput": 332.54, "total_tokens": 47237536} {"current_steps": 37310, "total_steps": 40000, "loss": 0.0346, "lr": 0.0033377299133428126, "epoch": 1.823003444653458, "percentage": 93.27, "elapsed_time": "1 day, 15:27:34", "remaining_time": "2:50:41", "throughput": 332.58, "total_tokens": 47244000} {"current_steps": 37315, "total_steps": 40000, "loss": 0.0538, "lr": 0.003325384120029434, "epoch": 1.8232477463171524, "percentage": 93.29, "elapsed_time": "1 day, 15:27:37", "remaining_time": "2:50:21", "throughput": 332.61, "total_tokens": 47250464} {"current_steps": 37320, "total_steps": 40000, "loss": 0.0565, "lr": 0.0033130609457850233, "epoch": 1.8234920479808467, "percentage": 93.3, "elapsed_time": "1 day, 15:27:40", "remaining_time": "2:50:01", "throughput": 332.65, "total_tokens": 47256416} {"current_steps": 37325, "total_steps": 40000, "loss": 0.0615, "lr": 0.0033007603925100104, "epoch": 1.8237363496445411, "percentage": 93.31, "elapsed_time": "1 day, 15:27:43", "remaining_time": "2:49:41", "throughput": 332.69, "total_tokens": 47263168} {"current_steps": 37330, "total_steps": 40000, "loss": 0.0604, "lr": 0.003288482462101294, "epoch": 1.8239806513082355, "percentage": 93.33, "elapsed_time": "1 day, 15:27:46", "remaining_time": "2:49:21", "throughput": 332.73, "total_tokens": 47269408} {"current_steps": 37335, "total_steps": 40000, "loss": 0.0356, "lr": 0.0032762271564522605, "epoch": 1.8242249529719299, "percentage": 93.34, "elapsed_time": "1 day, 15:27:50", "remaining_time": "2:49:01", "throughput": 332.76, "total_tokens": 47275776} {"current_steps": 37340, "total_steps": 40000, "loss": 0.0623, "lr": 0.003263994477452864, "epoch": 1.824469254635624, "percentage": 93.35, "elapsed_time": "1 day, 15:27:53", "remaining_time": "2:48:40", "throughput": 332.8, "total_tokens": 47282368} {"current_steps": 37345, "total_steps": 40000, "loss": 0.0663, "lr": 0.0032517844269895125, "epoch": 1.8247135562993184, "percentage": 93.36, "elapsed_time": "1 day, 15:27:56", "remaining_time": "2:48:20", "throughput": 332.85, "total_tokens": 47289504} {"current_steps": 37350, "total_steps": 40000, "loss": 0.0709, "lr": 0.0032395970069451496, "epoch": 1.8249578579630126, "percentage": 93.38, "elapsed_time": "1 day, 15:27:59", "remaining_time": "2:48:00", "throughput": 332.88, "total_tokens": 47296000} {"current_steps": 37355, "total_steps": 40000, "loss": 0.0605, "lr": 0.0032274322191992388, "epoch": 1.825202159626707, "percentage": 93.39, "elapsed_time": "1 day, 15:28:02", "remaining_time": "2:47:40", "throughput": 332.92, "total_tokens": 47301984} {"current_steps": 37360, "total_steps": 40000, "loss": 0.0465, "lr": 0.0032152900656277294, "epoch": 1.8254464612904013, "percentage": 93.4, "elapsed_time": "1 day, 15:28:05", "remaining_time": "2:47:20", "throughput": 332.96, "total_tokens": 47308096} {"current_steps": 37365, "total_steps": 40000, "loss": 0.0431, "lr": 0.0032031705481030902, "epoch": 1.8256907629540957, "percentage": 93.41, "elapsed_time": "1 day, 15:28:08", "remaining_time": "2:47:00", "throughput": 332.99, "total_tokens": 47314144} {"current_steps": 37370, "total_steps": 40000, "loss": 0.0618, "lr": 0.0031910736684943428, "epoch": 1.82593506461779, "percentage": 93.42, "elapsed_time": "1 day, 15:28:11", "remaining_time": "2:46:40", "throughput": 333.03, "total_tokens": 47320608} {"current_steps": 37375, "total_steps": 40000, "loss": 0.0462, "lr": 0.0031789994286669453, "epoch": 1.8261793662814845, "percentage": 93.44, "elapsed_time": "1 day, 15:28:14", "remaining_time": "2:46:19", "throughput": 333.06, "total_tokens": 47326240} {"current_steps": 37380, "total_steps": 40000, "loss": 0.0626, "lr": 0.003166947830482908, "epoch": 1.8264236679451789, "percentage": 93.45, "elapsed_time": "1 day, 15:28:17", "remaining_time": "2:45:59", "throughput": 333.1, "total_tokens": 47332096} {"current_steps": 37385, "total_steps": 40000, "loss": 0.0621, "lr": 0.003154918875800727, "epoch": 1.826667969608873, "percentage": 93.46, "elapsed_time": "1 day, 15:28:20", "remaining_time": "2:45:39", "throughput": 333.14, "total_tokens": 47338656} {"current_steps": 37390, "total_steps": 40000, "loss": 0.0906, "lr": 0.00314291256647542, "epoch": 1.8269122712725674, "percentage": 93.47, "elapsed_time": "1 day, 15:28:23", "remaining_time": "2:45:19", "throughput": 333.17, "total_tokens": 47344480} {"current_steps": 37395, "total_steps": 40000, "loss": 0.0519, "lr": 0.0031309289043585375, "epoch": 1.8271565729362615, "percentage": 93.49, "elapsed_time": "1 day, 15:28:26", "remaining_time": "2:44:59", "throughput": 333.2, "total_tokens": 47350560} {"current_steps": 37400, "total_steps": 40000, "loss": 0.0565, "lr": 0.003118967891298069, "epoch": 1.827400874599956, "percentage": 93.5, "elapsed_time": "1 day, 15:28:29", "remaining_time": "2:44:39", "throughput": 333.24, "total_tokens": 47356992} {"current_steps": 37400, "total_steps": 40000, "eval_loss": 0.06050002947449684, "epoch": 1.827400874599956, "percentage": 93.5, "elapsed_time": "1 day, 15:39:03", "remaining_time": "2:45:23", "throughput": 331.76, "total_tokens": 47356992} {"current_steps": 37405, "total_steps": 40000, "loss": 0.057, "lr": 0.003107029529138572, "epoch": 1.8276451762636503, "percentage": 93.51, "elapsed_time": "1 day, 15:39:07", "remaining_time": "2:45:03", "throughput": 331.8, "total_tokens": 47363264} {"current_steps": 37410, "total_steps": 40000, "loss": 0.0859, "lr": 0.0030951138197211235, "epoch": 1.8278894779273447, "percentage": 93.53, "elapsed_time": "1 day, 15:39:10", "remaining_time": "2:44:43", "throughput": 331.83, "total_tokens": 47369600} {"current_steps": 37415, "total_steps": 40000, "loss": 0.0596, "lr": 0.0030832207648832377, "epoch": 1.828133779591039, "percentage": 93.54, "elapsed_time": "1 day, 15:39:13", "remaining_time": "2:44:22", "throughput": 331.87, "total_tokens": 47375968} {"current_steps": 37420, "total_steps": 40000, "loss": 0.0366, "lr": 0.0030713503664589635, "epoch": 1.8283780812547334, "percentage": 93.55, "elapsed_time": "1 day, 15:39:17", "remaining_time": "2:44:02", "throughput": 331.91, "total_tokens": 47382368} {"current_steps": 37425, "total_steps": 40000, "loss": 0.0735, "lr": 0.0030595026262788872, "epoch": 1.8286223829184278, "percentage": 93.56, "elapsed_time": "1 day, 15:39:20", "remaining_time": "2:43:42", "throughput": 331.95, "total_tokens": 47388768} {"current_steps": 37430, "total_steps": 40000, "loss": 0.0576, "lr": 0.00304767754617008, "epoch": 1.828866684582122, "percentage": 93.58, "elapsed_time": "1 day, 15:39:23", "remaining_time": "2:43:22", "throughput": 331.98, "total_tokens": 47394848} {"current_steps": 37435, "total_steps": 40000, "loss": 0.0466, "lr": 0.003035875127956117, "epoch": 1.8291109862458164, "percentage": 93.59, "elapsed_time": "1 day, 15:39:26", "remaining_time": "2:43:02", "throughput": 332.02, "total_tokens": 47400800} {"current_steps": 37440, "total_steps": 40000, "loss": 0.0427, "lr": 0.0030240953734570752, "epoch": 1.8293552879095105, "percentage": 93.6, "elapsed_time": "1 day, 15:39:29", "remaining_time": "2:42:42", "throughput": 332.06, "total_tokens": 47407584} {"current_steps": 37445, "total_steps": 40000, "loss": 0.0431, "lr": 0.003012338284489535, "epoch": 1.829599589573205, "percentage": 93.61, "elapsed_time": "1 day, 15:39:32", "remaining_time": "2:42:21", "throughput": 332.1, "total_tokens": 47414016} {"current_steps": 37450, "total_steps": 40000, "loss": 0.0712, "lr": 0.0030006038628665964, "epoch": 1.8298438912368993, "percentage": 93.62, "elapsed_time": "1 day, 15:39:35", "remaining_time": "2:42:01", "throughput": 332.14, "total_tokens": 47420800} {"current_steps": 37455, "total_steps": 40000, "loss": 0.0541, "lr": 0.002988892110397845, "epoch": 1.8300881929005937, "percentage": 93.64, "elapsed_time": "1 day, 15:39:38", "remaining_time": "2:41:41", "throughput": 332.17, "total_tokens": 47426848} {"current_steps": 37460, "total_steps": 40000, "loss": 0.0876, "lr": 0.0029772030288894025, "epoch": 1.830332494564288, "percentage": 93.65, "elapsed_time": "1 day, 15:39:41", "remaining_time": "2:41:21", "throughput": 332.2, "total_tokens": 47432704} {"current_steps": 37465, "total_steps": 40000, "loss": 0.0566, "lr": 0.0029655366201438438, "epoch": 1.8305767962279824, "percentage": 93.66, "elapsed_time": "1 day, 15:39:44", "remaining_time": "2:41:01", "throughput": 332.24, "total_tokens": 47439072} {"current_steps": 37470, "total_steps": 40000, "loss": 0.0705, "lr": 0.0029538928859602965, "epoch": 1.8308210978916768, "percentage": 93.67, "elapsed_time": "1 day, 15:39:47", "remaining_time": "2:40:41", "throughput": 332.28, "total_tokens": 47444928} {"current_steps": 37475, "total_steps": 40000, "loss": 0.0659, "lr": 0.002942271828134374, "epoch": 1.831065399555371, "percentage": 93.69, "elapsed_time": "1 day, 15:39:50", "remaining_time": "2:40:20", "throughput": 332.31, "total_tokens": 47451168} {"current_steps": 37480, "total_steps": 40000, "loss": 0.0316, "lr": 0.00293067344845816, "epoch": 1.8313097012190653, "percentage": 93.7, "elapsed_time": "1 day, 15:39:53", "remaining_time": "2:40:00", "throughput": 332.35, "total_tokens": 47457728} {"current_steps": 37485, "total_steps": 40000, "loss": 0.048, "lr": 0.0029190977487202896, "epoch": 1.8315540028827595, "percentage": 93.71, "elapsed_time": "1 day, 15:39:56", "remaining_time": "2:39:40", "throughput": 332.39, "total_tokens": 47463808} {"current_steps": 37490, "total_steps": 40000, "loss": 0.0667, "lr": 0.0029075447307058853, "epoch": 1.8317983045464539, "percentage": 93.73, "elapsed_time": "1 day, 15:39:59", "remaining_time": "2:39:20", "throughput": 332.42, "total_tokens": 47470112} {"current_steps": 37495, "total_steps": 40000, "loss": 0.0318, "lr": 0.0028960143961965722, "epoch": 1.8320426062101483, "percentage": 93.74, "elapsed_time": "1 day, 15:40:02", "remaining_time": "2:39:00", "throughput": 332.46, "total_tokens": 47476448} {"current_steps": 37500, "total_steps": 40000, "loss": 0.0364, "lr": 0.002884506746970461, "epoch": 1.8322869078738426, "percentage": 93.75, "elapsed_time": "1 day, 15:40:05", "remaining_time": "2:38:40", "throughput": 332.5, "total_tokens": 47482624} {"current_steps": 37505, "total_steps": 40000, "loss": 0.034, "lr": 0.0028730217848021654, "epoch": 1.832531209537537, "percentage": 93.76, "elapsed_time": "1 day, 15:40:08", "remaining_time": "2:38:20", "throughput": 332.54, "total_tokens": 47489216} {"current_steps": 37510, "total_steps": 40000, "loss": 0.0605, "lr": 0.0028615595114628188, "epoch": 1.8327755112012314, "percentage": 93.77, "elapsed_time": "1 day, 15:40:12", "remaining_time": "2:38:00", "throughput": 332.57, "total_tokens": 47495648} {"current_steps": 37515, "total_steps": 40000, "loss": 0.0562, "lr": 0.002850119928720074, "epoch": 1.8330198128649258, "percentage": 93.79, "elapsed_time": "1 day, 15:40:15", "remaining_time": "2:37:40", "throughput": 332.61, "total_tokens": 47501568} {"current_steps": 37520, "total_steps": 40000, "loss": 0.0438, "lr": 0.0028387030383380195, "epoch": 1.83326411452862, "percentage": 93.8, "elapsed_time": "1 day, 15:40:18", "remaining_time": "2:37:20", "throughput": 332.65, "total_tokens": 47508384} {"current_steps": 37525, "total_steps": 40000, "loss": 0.0632, "lr": 0.0028273088420772974, "epoch": 1.8335084161923143, "percentage": 93.81, "elapsed_time": "1 day, 15:40:21", "remaining_time": "2:36:59", "throughput": 332.69, "total_tokens": 47514720} {"current_steps": 37530, "total_steps": 40000, "loss": 0.074, "lr": 0.002815937341695068, "epoch": 1.8337527178560085, "percentage": 93.83, "elapsed_time": "1 day, 15:40:24", "remaining_time": "2:36:39", "throughput": 332.72, "total_tokens": 47520736} {"current_steps": 37535, "total_steps": 40000, "loss": 0.0624, "lr": 0.0028045885389448963, "epoch": 1.8339970195197028, "percentage": 93.84, "elapsed_time": "1 day, 15:40:27", "remaining_time": "2:36:19", "throughput": 332.76, "total_tokens": 47527008} {"current_steps": 37540, "total_steps": 40000, "loss": 0.0862, "lr": 0.002793262435576965, "epoch": 1.8342413211833972, "percentage": 93.85, "elapsed_time": "1 day, 15:40:30", "remaining_time": "2:35:59", "throughput": 332.8, "total_tokens": 47533536} {"current_steps": 37545, "total_steps": 40000, "loss": 0.0371, "lr": 0.0027819590333378772, "epoch": 1.8344856228470916, "percentage": 93.86, "elapsed_time": "1 day, 15:40:33", "remaining_time": "2:35:39", "throughput": 332.83, "total_tokens": 47539648} {"current_steps": 37550, "total_steps": 40000, "loss": 0.0468, "lr": 0.002770678333970755, "epoch": 1.834729924510786, "percentage": 93.88, "elapsed_time": "1 day, 15:40:36", "remaining_time": "2:35:19", "throughput": 332.87, "total_tokens": 47546016} {"current_steps": 37555, "total_steps": 40000, "loss": 0.0594, "lr": 0.0027594203392152573, "epoch": 1.8349742261744804, "percentage": 93.89, "elapsed_time": "1 day, 15:40:39", "remaining_time": "2:34:59", "throughput": 332.91, "total_tokens": 47552352} {"current_steps": 37560, "total_steps": 40000, "loss": 0.0604, "lr": 0.002748185050807478, "epoch": 1.8352185278381747, "percentage": 93.9, "elapsed_time": "1 day, 15:40:42", "remaining_time": "2:34:39", "throughput": 332.94, "total_tokens": 47558272} {"current_steps": 37565, "total_steps": 40000, "loss": 0.1239, "lr": 0.002736972470480031, "epoch": 1.835462829501869, "percentage": 93.91, "elapsed_time": "1 day, 15:40:45", "remaining_time": "2:34:19", "throughput": 332.98, "total_tokens": 47564768} {"current_steps": 37570, "total_steps": 40000, "loss": 0.0305, "lr": 0.002725782599962068, "epoch": 1.8357071311655633, "percentage": 93.92, "elapsed_time": "1 day, 15:40:48", "remaining_time": "2:33:59", "throughput": 333.02, "total_tokens": 47571584} {"current_steps": 37575, "total_steps": 40000, "loss": 0.0255, "lr": 0.0027146154409791734, "epoch": 1.8359514328292574, "percentage": 93.94, "elapsed_time": "1 day, 15:40:52", "remaining_time": "2:33:39", "throughput": 333.06, "total_tokens": 47578400} {"current_steps": 37580, "total_steps": 40000, "loss": 0.024, "lr": 0.002703470995253504, "epoch": 1.8361957344929518, "percentage": 93.95, "elapsed_time": "1 day, 15:40:54", "remaining_time": "2:33:19", "throughput": 333.1, "total_tokens": 47584480} {"current_steps": 37585, "total_steps": 40000, "loss": 0.0571, "lr": 0.0026923492645036184, "epoch": 1.8364400361566462, "percentage": 93.96, "elapsed_time": "1 day, 15:40:58", "remaining_time": "2:32:59", "throughput": 333.13, "total_tokens": 47590912} {"current_steps": 37590, "total_steps": 40000, "loss": 0.0413, "lr": 0.0026812502504446776, "epoch": 1.8366843378203406, "percentage": 93.97, "elapsed_time": "1 day, 15:41:01", "remaining_time": "2:32:39", "throughput": 333.17, "total_tokens": 47596992} {"current_steps": 37595, "total_steps": 40000, "loss": 0.063, "lr": 0.0026701739547882798, "epoch": 1.836928639484035, "percentage": 93.99, "elapsed_time": "1 day, 15:41:04", "remaining_time": "2:32:19", "throughput": 333.21, "total_tokens": 47603040} {"current_steps": 37600, "total_steps": 40000, "loss": 0.0445, "lr": 0.0026591203792425077, "epoch": 1.8371729411477293, "percentage": 94.0, "elapsed_time": "1 day, 15:41:07", "remaining_time": "2:31:59", "throughput": 333.24, "total_tokens": 47609472} {"current_steps": 37600, "total_steps": 40000, "eval_loss": 0.06058171018958092, "epoch": 1.8371729411477293, "percentage": 94.0, "elapsed_time": "1 day, 15:51:41", "remaining_time": "2:32:39", "throughput": 331.77, "total_tokens": 47609472} {"current_steps": 37605, "total_steps": 40000, "loss": 0.0557, "lr": 0.0026480895255119818, "epoch": 1.8374172428114237, "percentage": 94.01, "elapsed_time": "1 day, 15:51:46", "remaining_time": "2:32:19", "throughput": 331.8, "total_tokens": 47615456} {"current_steps": 37610, "total_steps": 40000, "loss": 0.0433, "lr": 0.002637081395297791, "epoch": 1.8376615444751179, "percentage": 94.03, "elapsed_time": "1 day, 15:51:49", "remaining_time": "2:31:59", "throughput": 331.84, "total_tokens": 47621728} {"current_steps": 37615, "total_steps": 40000, "loss": 0.0672, "lr": 0.0026260959902975113, "epoch": 1.8379058461388122, "percentage": 94.04, "elapsed_time": "1 day, 15:51:52", "remaining_time": "2:31:39", "throughput": 331.87, "total_tokens": 47628096} {"current_steps": 37620, "total_steps": 40000, "loss": 0.0621, "lr": 0.00261513331220527, "epoch": 1.8381501478025064, "percentage": 94.05, "elapsed_time": "1 day, 15:51:56", "remaining_time": "2:31:19", "throughput": 331.91, "total_tokens": 47634656} {"current_steps": 37625, "total_steps": 40000, "loss": 0.0587, "lr": 0.0026041933627116154, "epoch": 1.8383944494662008, "percentage": 94.06, "elapsed_time": "1 day, 15:51:59", "remaining_time": "2:30:59", "throughput": 331.95, "total_tokens": 47640608} {"current_steps": 37630, "total_steps": 40000, "loss": 0.033, "lr": 0.0025932761435036476, "epoch": 1.8386387511298952, "percentage": 94.08, "elapsed_time": "1 day, 15:52:02", "remaining_time": "2:30:39", "throughput": 331.98, "total_tokens": 47647168} {"current_steps": 37635, "total_steps": 40000, "loss": 0.0516, "lr": 0.002582381656264904, "epoch": 1.8388830527935895, "percentage": 94.09, "elapsed_time": "1 day, 15:52:05", "remaining_time": "2:30:19", "throughput": 332.02, "total_tokens": 47653312} {"current_steps": 37640, "total_steps": 40000, "loss": 0.0576, "lr": 0.0025715099026754895, "epoch": 1.839127354457284, "percentage": 94.1, "elapsed_time": "1 day, 15:52:08", "remaining_time": "2:29:59", "throughput": 332.06, "total_tokens": 47659520} {"current_steps": 37645, "total_steps": 40000, "loss": 0.071, "lr": 0.002560660884411947, "epoch": 1.8393716561209783, "percentage": 94.11, "elapsed_time": "1 day, 15:52:11", "remaining_time": "2:29:39", "throughput": 332.09, "total_tokens": 47665440} {"current_steps": 37650, "total_steps": 40000, "loss": 0.0782, "lr": 0.0025498346031473385, "epoch": 1.8396159577846725, "percentage": 94.12, "elapsed_time": "1 day, 15:52:14", "remaining_time": "2:29:18", "throughput": 332.13, "total_tokens": 47672096} {"current_steps": 37655, "total_steps": 40000, "loss": 0.0619, "lr": 0.0025390310605511945, "epoch": 1.8398602594483668, "percentage": 94.14, "elapsed_time": "1 day, 15:52:17", "remaining_time": "2:28:58", "throughput": 332.16, "total_tokens": 47678112} {"current_steps": 37660, "total_steps": 40000, "loss": 0.0845, "lr": 0.0025282502582895995, "epoch": 1.8401045611120612, "percentage": 94.15, "elapsed_time": "1 day, 15:52:20", "remaining_time": "2:28:38", "throughput": 332.2, "total_tokens": 47684288} {"current_steps": 37665, "total_steps": 40000, "loss": 0.067, "lr": 0.002517492198025023, "epoch": 1.8403488627757554, "percentage": 94.16, "elapsed_time": "1 day, 15:52:23", "remaining_time": "2:28:18", "throughput": 332.24, "total_tokens": 47690720} {"current_steps": 37670, "total_steps": 40000, "loss": 0.0693, "lr": 0.0025067568814165554, "epoch": 1.8405931644394498, "percentage": 94.17, "elapsed_time": "1 day, 15:52:26", "remaining_time": "2:27:58", "throughput": 332.27, "total_tokens": 47696896} {"current_steps": 37675, "total_steps": 40000, "loss": 0.0558, "lr": 0.0024960443101196884, "epoch": 1.8408374661031441, "percentage": 94.19, "elapsed_time": "1 day, 15:52:29", "remaining_time": "2:27:38", "throughput": 332.31, "total_tokens": 47702912} {"current_steps": 37680, "total_steps": 40000, "loss": 0.0451, "lr": 0.002485354485786434, "epoch": 1.8410817677668385, "percentage": 94.2, "elapsed_time": "1 day, 15:52:32", "remaining_time": "2:27:18", "throughput": 332.34, "total_tokens": 47708864} {"current_steps": 37685, "total_steps": 40000, "loss": 0.0466, "lr": 0.002474687410065307, "epoch": 1.841326069430533, "percentage": 94.21, "elapsed_time": "1 day, 15:52:35", "remaining_time": "2:26:58", "throughput": 332.38, "total_tokens": 47715168} {"current_steps": 37690, "total_steps": 40000, "loss": 0.0849, "lr": 0.002464043084601308, "epoch": 1.8415703710942273, "percentage": 94.23, "elapsed_time": "1 day, 15:52:38", "remaining_time": "2:26:38", "throughput": 332.42, "total_tokens": 47721600} {"current_steps": 37695, "total_steps": 40000, "loss": 0.0284, "lr": 0.0024534215110358915, "epoch": 1.8418146727579214, "percentage": 94.24, "elapsed_time": "1 day, 15:52:41", "remaining_time": "2:26:18", "throughput": 332.46, "total_tokens": 47728032} {"current_steps": 37700, "total_steps": 40000, "loss": 0.0618, "lr": 0.002442822691007096, "epoch": 1.8420589744216158, "percentage": 94.25, "elapsed_time": "1 day, 15:52:44", "remaining_time": "2:25:58", "throughput": 332.49, "total_tokens": 47734144} {"current_steps": 37705, "total_steps": 40000, "loss": 0.0866, "lr": 0.002432246626149348, "epoch": 1.8423032760853102, "percentage": 94.26, "elapsed_time": "1 day, 15:52:47", "remaining_time": "2:25:38", "throughput": 332.53, "total_tokens": 47740704} {"current_steps": 37710, "total_steps": 40000, "loss": 0.0381, "lr": 0.002421693318093626, "epoch": 1.8425475777490044, "percentage": 94.27, "elapsed_time": "1 day, 15:52:51", "remaining_time": "2:25:18", "throughput": 332.57, "total_tokens": 47747040} {"current_steps": 37715, "total_steps": 40000, "loss": 0.0606, "lr": 0.0024111627684673784, "epoch": 1.8427918794126987, "percentage": 94.29, "elapsed_time": "1 day, 15:52:54", "remaining_time": "2:24:58", "throughput": 332.6, "total_tokens": 47752960} {"current_steps": 37720, "total_steps": 40000, "loss": 0.0672, "lr": 0.0024006549788945395, "epoch": 1.843036181076393, "percentage": 94.3, "elapsed_time": "1 day, 15:52:57", "remaining_time": "2:24:38", "throughput": 332.64, "total_tokens": 47759488} {"current_steps": 37725, "total_steps": 40000, "loss": 0.0478, "lr": 0.0023901699509955463, "epoch": 1.8432804827400875, "percentage": 94.31, "elapsed_time": "1 day, 15:53:00", "remaining_time": "2:24:18", "throughput": 332.68, "total_tokens": 47765696} {"current_steps": 37730, "total_steps": 40000, "loss": 0.0354, "lr": 0.0023797076863873554, "epoch": 1.8435247844037819, "percentage": 94.33, "elapsed_time": "1 day, 15:53:03", "remaining_time": "2:23:58", "throughput": 332.71, "total_tokens": 47771680} {"current_steps": 37735, "total_steps": 40000, "loss": 0.0524, "lr": 0.0023692681866833262, "epoch": 1.8437690860674762, "percentage": 94.34, "elapsed_time": "1 day, 15:53:06", "remaining_time": "2:23:38", "throughput": 332.75, "total_tokens": 47777952} {"current_steps": 37740, "total_steps": 40000, "loss": 0.0375, "lr": 0.0023588514534934046, "epoch": 1.8440133877311704, "percentage": 94.35, "elapsed_time": "1 day, 15:53:09", "remaining_time": "2:23:18", "throughput": 332.78, "total_tokens": 47784256} {"current_steps": 37745, "total_steps": 40000, "loss": 0.0475, "lr": 0.002348457488423955, "epoch": 1.8442576893948648, "percentage": 94.36, "elapsed_time": "1 day, 15:53:12", "remaining_time": "2:22:58", "throughput": 332.82, "total_tokens": 47790368} {"current_steps": 37750, "total_steps": 40000, "loss": 0.0614, "lr": 0.0023380862930778624, "epoch": 1.844501991058559, "percentage": 94.38, "elapsed_time": "1 day, 15:53:15", "remaining_time": "2:22:38", "throughput": 332.85, "total_tokens": 47796320} {"current_steps": 37755, "total_steps": 40000, "loss": 0.0792, "lr": 0.0023277378690545135, "epoch": 1.8447462927222533, "percentage": 94.39, "elapsed_time": "1 day, 15:53:18", "remaining_time": "2:22:18", "throughput": 332.89, "total_tokens": 47802784} {"current_steps": 37760, "total_steps": 40000, "loss": 0.05, "lr": 0.0023174122179497325, "epoch": 1.8449905943859477, "percentage": 94.4, "elapsed_time": "1 day, 15:53:21", "remaining_time": "2:21:58", "throughput": 332.93, "total_tokens": 47808928} {"current_steps": 37765, "total_steps": 40000, "loss": 0.0426, "lr": 0.0023071093413558784, "epoch": 1.845234896049642, "percentage": 94.41, "elapsed_time": "1 day, 15:53:24", "remaining_time": "2:21:38", "throughput": 332.96, "total_tokens": 47815200} {"current_steps": 37770, "total_steps": 40000, "loss": 0.0521, "lr": 0.002296829240861814, "epoch": 1.8454791977133365, "percentage": 94.42, "elapsed_time": "1 day, 15:53:27", "remaining_time": "2:21:18", "throughput": 333.0, "total_tokens": 47821568} {"current_steps": 37775, "total_steps": 40000, "loss": 0.0442, "lr": 0.002286571918052821, "epoch": 1.8457234993770308, "percentage": 94.44, "elapsed_time": "1 day, 15:53:30", "remaining_time": "2:20:58", "throughput": 333.04, "total_tokens": 47827712} {"current_steps": 37780, "total_steps": 40000, "loss": 0.063, "lr": 0.0022763373745107174, "epoch": 1.8459678010407252, "percentage": 94.45, "elapsed_time": "1 day, 15:53:33", "remaining_time": "2:20:38", "throughput": 333.07, "total_tokens": 47833632} {"current_steps": 37785, "total_steps": 40000, "loss": 0.0759, "lr": 0.0022661256118138074, "epoch": 1.8462121027044194, "percentage": 94.46, "elapsed_time": "1 day, 15:53:36", "remaining_time": "2:20:18", "throughput": 333.11, "total_tokens": 47840000} {"current_steps": 37790, "total_steps": 40000, "loss": 0.0386, "lr": 0.0022559366315368645, "epoch": 1.8464564043681138, "percentage": 94.47, "elapsed_time": "1 day, 15:53:39", "remaining_time": "2:19:59", "throughput": 333.15, "total_tokens": 47846400} {"current_steps": 37795, "total_steps": 40000, "loss": 0.0518, "lr": 0.002245770435251182, "epoch": 1.846700706031808, "percentage": 94.49, "elapsed_time": "1 day, 15:53:42", "remaining_time": "2:19:39", "throughput": 333.18, "total_tokens": 47852768} {"current_steps": 37800, "total_steps": 40000, "loss": 0.0586, "lr": 0.002235627024524456, "epoch": 1.8469450076955023, "percentage": 94.5, "elapsed_time": "1 day, 15:53:46", "remaining_time": "2:19:19", "throughput": 333.22, "total_tokens": 47859360} {"current_steps": 37800, "total_steps": 40000, "eval_loss": 0.06058782339096069, "epoch": 1.8469450076955023, "percentage": 94.5, "elapsed_time": "1 day, 16:04:20", "remaining_time": "2:19:56", "throughput": 331.76, "total_tokens": 47859360} {"current_steps": 37805, "total_steps": 40000, "loss": 0.0452, "lr": 0.0022255064009209847, "epoch": 1.8471893093591967, "percentage": 94.51, "elapsed_time": "1 day, 16:04:24", "remaining_time": "2:19:36", "throughput": 331.79, "total_tokens": 47865920} {"current_steps": 37810, "total_steps": 40000, "loss": 0.0491, "lr": 0.0022154085660014864, "epoch": 1.847433611022891, "percentage": 94.53, "elapsed_time": "1 day, 16:04:27", "remaining_time": "2:19:16", "throughput": 331.83, "total_tokens": 47872416} {"current_steps": 37815, "total_steps": 40000, "loss": 0.0482, "lr": 0.0022053335213231494, "epoch": 1.8476779126865854, "percentage": 94.54, "elapsed_time": "1 day, 16:04:30", "remaining_time": "2:18:56", "throughput": 331.87, "total_tokens": 47879072} {"current_steps": 37820, "total_steps": 40000, "loss": 0.0352, "lr": 0.002195281268439697, "epoch": 1.8479222143502798, "percentage": 94.55, "elapsed_time": "1 day, 16:04:33", "remaining_time": "2:18:36", "throughput": 331.91, "total_tokens": 47885120} {"current_steps": 37825, "total_steps": 40000, "loss": 0.0867, "lr": 0.002185251808901306, "epoch": 1.8481665160139742, "percentage": 94.56, "elapsed_time": "1 day, 16:04:36", "remaining_time": "2:18:16", "throughput": 331.94, "total_tokens": 47891168} {"current_steps": 37830, "total_steps": 40000, "loss": 0.0555, "lr": 0.0021752451442546227, "epoch": 1.8484108176776683, "percentage": 94.58, "elapsed_time": "1 day, 16:04:39", "remaining_time": "2:17:56", "throughput": 331.97, "total_tokens": 47897152} {"current_steps": 37835, "total_steps": 40000, "loss": 0.0423, "lr": 0.0021652612760428456, "epoch": 1.8486551193413627, "percentage": 94.59, "elapsed_time": "1 day, 16:04:42", "remaining_time": "2:17:36", "throughput": 332.01, "total_tokens": 47903104} {"current_steps": 37840, "total_steps": 40000, "loss": 0.0336, "lr": 0.0021553002058055603, "epoch": 1.8488994210050569, "percentage": 94.6, "elapsed_time": "1 day, 16:04:45", "remaining_time": "2:17:16", "throughput": 332.05, "total_tokens": 47909440} {"current_steps": 37845, "total_steps": 40000, "loss": 0.0543, "lr": 0.0021453619350789376, "epoch": 1.8491437226687513, "percentage": 94.61, "elapsed_time": "1 day, 16:04:48", "remaining_time": "2:16:56", "throughput": 332.08, "total_tokens": 47915712} {"current_steps": 37850, "total_steps": 40000, "loss": 0.0625, "lr": 0.0021354464653955516, "epoch": 1.8493880243324456, "percentage": 94.62, "elapsed_time": "1 day, 16:04:51", "remaining_time": "2:16:36", "throughput": 332.12, "total_tokens": 47921760} {"current_steps": 37855, "total_steps": 40000, "loss": 0.0474, "lr": 0.002125553798284513, "epoch": 1.84963232599614, "percentage": 94.64, "elapsed_time": "1 day, 16:04:54", "remaining_time": "2:16:16", "throughput": 332.15, "total_tokens": 47928000} {"current_steps": 37860, "total_steps": 40000, "loss": 0.0508, "lr": 0.002115683935271384, "epoch": 1.8498766276598344, "percentage": 94.65, "elapsed_time": "1 day, 16:04:57", "remaining_time": "2:15:56", "throughput": 332.19, "total_tokens": 47934144} {"current_steps": 37865, "total_steps": 40000, "loss": 0.0609, "lr": 0.0021058368778782144, "epoch": 1.8501209293235288, "percentage": 94.66, "elapsed_time": "1 day, 16:05:00", "remaining_time": "2:15:36", "throughput": 332.23, "total_tokens": 47940512} {"current_steps": 37870, "total_steps": 40000, "loss": 0.0396, "lr": 0.002096012627623539, "epoch": 1.8503652309872232, "percentage": 94.67, "elapsed_time": "1 day, 16:05:03", "remaining_time": "2:15:16", "throughput": 332.26, "total_tokens": 47946720} {"current_steps": 37875, "total_steps": 40000, "loss": 0.0724, "lr": 0.00208621118602243, "epoch": 1.8506095326509173, "percentage": 94.69, "elapsed_time": "1 day, 16:05:06", "remaining_time": "2:14:56", "throughput": 332.3, "total_tokens": 47952928} {"current_steps": 37880, "total_steps": 40000, "loss": 0.0463, "lr": 0.002076432554586327, "epoch": 1.8508538343146117, "percentage": 94.7, "elapsed_time": "1 day, 16:05:09", "remaining_time": "2:14:36", "throughput": 332.34, "total_tokens": 47959296} {"current_steps": 37885, "total_steps": 40000, "loss": 0.0512, "lr": 0.002066676734823258, "epoch": 1.8510981359783059, "percentage": 94.71, "elapsed_time": "1 day, 16:05:12", "remaining_time": "2:14:16", "throughput": 332.37, "total_tokens": 47965216} {"current_steps": 37890, "total_steps": 40000, "loss": 0.0555, "lr": 0.0020569437282376866, "epoch": 1.8513424376420002, "percentage": 94.73, "elapsed_time": "1 day, 16:05:15", "remaining_time": "2:13:56", "throughput": 332.41, "total_tokens": 47972096} {"current_steps": 37895, "total_steps": 40000, "loss": 0.051, "lr": 0.002047233536330545, "epoch": 1.8515867393056946, "percentage": 94.74, "elapsed_time": "1 day, 16:05:18", "remaining_time": "2:13:36", "throughput": 332.45, "total_tokens": 47978528} {"current_steps": 37900, "total_steps": 40000, "loss": 0.0689, "lr": 0.0020375461605993015, "epoch": 1.851831040969389, "percentage": 94.75, "elapsed_time": "1 day, 16:05:22", "remaining_time": "2:13:16", "throughput": 332.48, "total_tokens": 47984800} {"current_steps": 37905, "total_steps": 40000, "loss": 0.0448, "lr": 0.002027881602537845, "epoch": 1.8520753426330834, "percentage": 94.76, "elapsed_time": "1 day, 16:05:25", "remaining_time": "2:12:56", "throughput": 332.52, "total_tokens": 47990912} {"current_steps": 37910, "total_steps": 40000, "loss": 0.0801, "lr": 0.002018239863636567, "epoch": 1.8523196442967778, "percentage": 94.77, "elapsed_time": "1 day, 16:05:28", "remaining_time": "2:12:36", "throughput": 332.56, "total_tokens": 47997120} {"current_steps": 37915, "total_steps": 40000, "loss": 0.0343, "lr": 0.002008620945382378, "epoch": 1.8525639459604721, "percentage": 94.79, "elapsed_time": "1 day, 16:05:31", "remaining_time": "2:12:16", "throughput": 332.59, "total_tokens": 48003488} {"current_steps": 37920, "total_steps": 40000, "loss": 0.0764, "lr": 0.001999024849258607, "epoch": 1.8528082476241663, "percentage": 94.8, "elapsed_time": "1 day, 16:05:34", "remaining_time": "2:11:57", "throughput": 332.63, "total_tokens": 48009696} {"current_steps": 37925, "total_steps": 40000, "loss": 0.0429, "lr": 0.001989451576745105, "epoch": 1.8530525492878607, "percentage": 94.81, "elapsed_time": "1 day, 16:05:37", "remaining_time": "2:11:37", "throughput": 332.67, "total_tokens": 48016192} {"current_steps": 37930, "total_steps": 40000, "loss": 0.0816, "lr": 0.00197990112931819, "epoch": 1.8532968509515548, "percentage": 94.83, "elapsed_time": "1 day, 16:05:40", "remaining_time": "2:11:17", "throughput": 332.7, "total_tokens": 48022656} {"current_steps": 37935, "total_steps": 40000, "loss": 0.0658, "lr": 0.0019703735084506345, "epoch": 1.8535411526152492, "percentage": 94.84, "elapsed_time": "1 day, 16:05:43", "remaining_time": "2:10:57", "throughput": 332.74, "total_tokens": 48029088} {"current_steps": 37940, "total_steps": 40000, "loss": 0.0423, "lr": 0.001960868715611763, "epoch": 1.8537854542789436, "percentage": 94.85, "elapsed_time": "1 day, 16:05:46", "remaining_time": "2:10:37", "throughput": 332.78, "total_tokens": 48035584} {"current_steps": 37945, "total_steps": 40000, "loss": 0.0902, "lr": 0.0019513867522673034, "epoch": 1.854029755942638, "percentage": 94.86, "elapsed_time": "1 day, 16:05:49", "remaining_time": "2:10:17", "throughput": 332.81, "total_tokens": 48041440} {"current_steps": 37950, "total_steps": 40000, "loss": 0.0446, "lr": 0.001941927619879502, "epoch": 1.8542740576063323, "percentage": 94.88, "elapsed_time": "1 day, 16:05:52", "remaining_time": "2:09:57", "throughput": 332.85, "total_tokens": 48047872} {"current_steps": 37955, "total_steps": 40000, "loss": 0.0679, "lr": 0.0019324913199070758, "epoch": 1.8545183592700267, "percentage": 94.89, "elapsed_time": "1 day, 16:05:55", "remaining_time": "2:09:37", "throughput": 332.89, "total_tokens": 48054016} {"current_steps": 37960, "total_steps": 40000, "loss": 0.0564, "lr": 0.0019230778538052106, "epoch": 1.854762660933721, "percentage": 94.9, "elapsed_time": "1 day, 16:05:58", "remaining_time": "2:09:17", "throughput": 332.92, "total_tokens": 48060352} {"current_steps": 37965, "total_steps": 40000, "loss": 0.0555, "lr": 0.0019136872230255952, "epoch": 1.8550069625974153, "percentage": 94.91, "elapsed_time": "1 day, 16:06:01", "remaining_time": "2:08:58", "throughput": 332.96, "total_tokens": 48066464} {"current_steps": 37970, "total_steps": 40000, "loss": 0.0732, "lr": 0.0019043194290164045, "epoch": 1.8552512642611096, "percentage": 94.92, "elapsed_time": "1 day, 16:06:05", "remaining_time": "2:08:38", "throughput": 333.0, "total_tokens": 48073216} {"current_steps": 37975, "total_steps": 40000, "loss": 0.0619, "lr": 0.0018949744732222162, "epoch": 1.8554955659248038, "percentage": 94.94, "elapsed_time": "1 day, 16:06:08", "remaining_time": "2:08:18", "throughput": 333.03, "total_tokens": 48079296} {"current_steps": 37980, "total_steps": 40000, "loss": 0.0452, "lr": 0.0018856523570841776, "epoch": 1.8557398675884982, "percentage": 94.95, "elapsed_time": "1 day, 16:06:11", "remaining_time": "2:07:58", "throughput": 333.07, "total_tokens": 48085696} {"current_steps": 37985, "total_steps": 40000, "loss": 0.0869, "lr": 0.0018763530820398555, "epoch": 1.8559841692521926, "percentage": 94.96, "elapsed_time": "1 day, 16:06:14", "remaining_time": "2:07:38", "throughput": 333.11, "total_tokens": 48092032} {"current_steps": 37990, "total_steps": 40000, "loss": 0.0443, "lr": 0.0018670766495233525, "epoch": 1.856228470915887, "percentage": 94.97, "elapsed_time": "1 day, 16:06:17", "remaining_time": "2:07:18", "throughput": 333.14, "total_tokens": 48098272} {"current_steps": 37995, "total_steps": 40000, "loss": 0.0779, "lr": 0.001857823060965158, "epoch": 1.8564727725795813, "percentage": 94.99, "elapsed_time": "1 day, 16:06:20", "remaining_time": "2:06:58", "throughput": 333.18, "total_tokens": 48104544} {"current_steps": 38000, "total_steps": 40000, "loss": 0.0785, "lr": 0.0018485923177923467, "epoch": 1.8567170742432757, "percentage": 95.0, "elapsed_time": "1 day, 16:06:23", "remaining_time": "2:06:39", "throughput": 333.22, "total_tokens": 48110912} {"current_steps": 38000, "total_steps": 40000, "eval_loss": 0.06050892546772957, "epoch": 1.8567170742432757, "percentage": 95.0, "elapsed_time": "1 day, 16:16:57", "remaining_time": "2:07:12", "throughput": 331.76, "total_tokens": 48110912} {"current_steps": 38005, "total_steps": 40000, "loss": 0.0436, "lr": 0.001839384421428364, "epoch": 1.85696137590697, "percentage": 95.01, "elapsed_time": "1 day, 16:17:01", "remaining_time": "2:06:52", "throughput": 331.8, "total_tokens": 48118080} {"current_steps": 38010, "total_steps": 40000, "loss": 0.0567, "lr": 0.0018301993732932065, "epoch": 1.8572056775706642, "percentage": 95.03, "elapsed_time": "1 day, 16:17:04", "remaining_time": "2:06:32", "throughput": 331.84, "total_tokens": 48124608} {"current_steps": 38015, "total_steps": 40000, "loss": 0.0885, "lr": 0.0018210371748033248, "epoch": 1.8574499792343586, "percentage": 95.04, "elapsed_time": "1 day, 16:17:07", "remaining_time": "2:06:12", "throughput": 331.87, "total_tokens": 48130816} {"current_steps": 38020, "total_steps": 40000, "loss": 0.0665, "lr": 0.0018118978273716556, "epoch": 1.8576942808980528, "percentage": 95.05, "elapsed_time": "1 day, 16:17:10", "remaining_time": "2:05:52", "throughput": 331.91, "total_tokens": 48137440} {"current_steps": 38025, "total_steps": 40000, "loss": 0.0501, "lr": 0.001802781332407588, "epoch": 1.8579385825617472, "percentage": 95.06, "elapsed_time": "1 day, 16:17:13", "remaining_time": "2:05:32", "throughput": 331.95, "total_tokens": 48143296} {"current_steps": 38030, "total_steps": 40000, "loss": 0.0553, "lr": 0.0017936876913169806, "epoch": 1.8581828842254415, "percentage": 95.08, "elapsed_time": "1 day, 16:17:16", "remaining_time": "2:05:13", "throughput": 331.98, "total_tokens": 48149696} {"current_steps": 38035, "total_steps": 40000, "loss": 0.0876, "lr": 0.0017846169055022287, "epoch": 1.858427185889136, "percentage": 95.09, "elapsed_time": "1 day, 16:17:19", "remaining_time": "2:04:53", "throughput": 332.02, "total_tokens": 48155584} {"current_steps": 38040, "total_steps": 40000, "loss": 0.0652, "lr": 0.0017755689763621295, "epoch": 1.8586714875528303, "percentage": 95.1, "elapsed_time": "1 day, 16:17:22", "remaining_time": "2:04:33", "throughput": 332.05, "total_tokens": 48161728} {"current_steps": 38045, "total_steps": 40000, "loss": 0.0596, "lr": 0.0017665439052920173, "epoch": 1.8589157892165247, "percentage": 95.11, "elapsed_time": "1 day, 16:17:25", "remaining_time": "2:04:13", "throughput": 332.09, "total_tokens": 48167904} {"current_steps": 38050, "total_steps": 40000, "loss": 0.0841, "lr": 0.0017575416936836286, "epoch": 1.859160090880219, "percentage": 95.12, "elapsed_time": "1 day, 16:17:28", "remaining_time": "2:03:53", "throughput": 332.12, "total_tokens": 48174272} {"current_steps": 38055, "total_steps": 40000, "loss": 0.0499, "lr": 0.0017485623429252528, "epoch": 1.8594043925439132, "percentage": 95.14, "elapsed_time": "1 day, 16:17:31", "remaining_time": "2:03:33", "throughput": 332.16, "total_tokens": 48180864} {"current_steps": 38060, "total_steps": 40000, "loss": 0.0951, "lr": 0.0017396058544016156, "epoch": 1.8596486942076076, "percentage": 95.15, "elapsed_time": "1 day, 16:17:34", "remaining_time": "2:03:13", "throughput": 332.2, "total_tokens": 48187456} {"current_steps": 38065, "total_steps": 40000, "loss": 0.0681, "lr": 0.0017306722294938958, "epoch": 1.8598929958713017, "percentage": 95.16, "elapsed_time": "1 day, 16:17:37", "remaining_time": "2:02:53", "throughput": 332.24, "total_tokens": 48193440} {"current_steps": 38070, "total_steps": 40000, "loss": 0.0472, "lr": 0.0017217614695798078, "epoch": 1.8601372975349961, "percentage": 95.17, "elapsed_time": "1 day, 16:17:40", "remaining_time": "2:02:34", "throughput": 332.27, "total_tokens": 48199648} {"current_steps": 38075, "total_steps": 40000, "loss": 0.0857, "lr": 0.001712873576033469, "epoch": 1.8603815991986905, "percentage": 95.19, "elapsed_time": "1 day, 16:17:43", "remaining_time": "2:02:14", "throughput": 332.31, "total_tokens": 48205696} {"current_steps": 38080, "total_steps": 40000, "loss": 0.0544, "lr": 0.0017040085502255163, "epoch": 1.8606259008623849, "percentage": 95.2, "elapsed_time": "1 day, 16:17:47", "remaining_time": "2:01:54", "throughput": 332.34, "total_tokens": 48212128} {"current_steps": 38085, "total_steps": 40000, "loss": 0.0408, "lr": 0.0016951663935230565, "epoch": 1.8608702025260793, "percentage": 95.21, "elapsed_time": "1 day, 16:17:50", "remaining_time": "2:01:34", "throughput": 332.38, "total_tokens": 48218432} {"current_steps": 38090, "total_steps": 40000, "loss": 0.0537, "lr": 0.0016863471072896485, "epoch": 1.8611145041897736, "percentage": 95.23, "elapsed_time": "1 day, 16:17:53", "remaining_time": "2:01:14", "throughput": 332.42, "total_tokens": 48224832} {"current_steps": 38095, "total_steps": 40000, "loss": 0.0341, "lr": 0.0016775506928853377, "epoch": 1.861358805853468, "percentage": 95.24, "elapsed_time": "1 day, 16:17:56", "remaining_time": "2:00:54", "throughput": 332.45, "total_tokens": 48230848} {"current_steps": 38100, "total_steps": 40000, "loss": 0.0515, "lr": 0.001668777151666656, "epoch": 1.8616031075171622, "percentage": 95.25, "elapsed_time": "1 day, 16:17:59", "remaining_time": "2:00:34", "throughput": 332.49, "total_tokens": 48237152} {"current_steps": 38105, "total_steps": 40000, "loss": 0.0712, "lr": 0.0016600264849865709, "epoch": 1.8618474091808566, "percentage": 95.26, "elapsed_time": "1 day, 16:18:02", "remaining_time": "2:00:15", "throughput": 332.52, "total_tokens": 48243200} {"current_steps": 38110, "total_steps": 40000, "loss": 0.053, "lr": 0.0016512986941945695, "epoch": 1.8620917108445507, "percentage": 95.28, "elapsed_time": "1 day, 16:18:05", "remaining_time": "1:59:55", "throughput": 332.56, "total_tokens": 48249440} {"current_steps": 38115, "total_steps": 40000, "loss": 0.0649, "lr": 0.0016425937806365753, "epoch": 1.862336012508245, "percentage": 95.29, "elapsed_time": "1 day, 16:18:08", "remaining_time": "1:59:35", "throughput": 332.59, "total_tokens": 48255584} {"current_steps": 38120, "total_steps": 40000, "loss": 0.0394, "lr": 0.0016339117456549979, "epoch": 1.8625803141719395, "percentage": 95.3, "elapsed_time": "1 day, 16:18:11", "remaining_time": "1:59:15", "throughput": 332.64, "total_tokens": 48262528} {"current_steps": 38125, "total_steps": 40000, "loss": 0.0641, "lr": 0.0016252525905886995, "epoch": 1.8628246158356339, "percentage": 95.31, "elapsed_time": "1 day, 16:18:14", "remaining_time": "1:58:55", "throughput": 332.67, "total_tokens": 48268832} {"current_steps": 38130, "total_steps": 40000, "loss": 0.0582, "lr": 0.0016166163167730617, "epoch": 1.8630689174993282, "percentage": 95.33, "elapsed_time": "1 day, 16:18:17", "remaining_time": "1:58:35", "throughput": 332.7, "total_tokens": 48274592} {"current_steps": 38135, "total_steps": 40000, "loss": 0.0841, "lr": 0.0016080029255398864, "epoch": 1.8633132191630226, "percentage": 95.34, "elapsed_time": "1 day, 16:18:20", "remaining_time": "1:58:16", "throughput": 332.74, "total_tokens": 48281056} {"current_steps": 38140, "total_steps": 40000, "loss": 0.046, "lr": 0.0015994124182174606, "epoch": 1.863557520826717, "percentage": 95.35, "elapsed_time": "1 day, 16:18:23", "remaining_time": "1:57:56", "throughput": 332.78, "total_tokens": 48287584} {"current_steps": 38145, "total_steps": 40000, "loss": 0.0595, "lr": 0.001590844796130575, "epoch": 1.8638018224904112, "percentage": 95.36, "elapsed_time": "1 day, 16:18:26", "remaining_time": "1:57:36", "throughput": 332.82, "total_tokens": 48293984} {"current_steps": 38150, "total_steps": 40000, "loss": 0.077, "lr": 0.001582300060600439, "epoch": 1.8640461241541055, "percentage": 95.38, "elapsed_time": "1 day, 16:18:29", "remaining_time": "1:57:16", "throughput": 332.85, "total_tokens": 48300160} {"current_steps": 38155, "total_steps": 40000, "loss": 0.0478, "lr": 0.0015737782129447652, "epoch": 1.8642904258177997, "percentage": 95.39, "elapsed_time": "1 day, 16:18:32", "remaining_time": "1:56:56", "throughput": 332.89, "total_tokens": 48306752} {"current_steps": 38160, "total_steps": 40000, "loss": 0.0856, "lr": 0.0015652792544777361, "epoch": 1.864534727481494, "percentage": 95.4, "elapsed_time": "1 day, 16:18:35", "remaining_time": "1:56:37", "throughput": 332.93, "total_tokens": 48312928} {"current_steps": 38165, "total_steps": 40000, "loss": 0.0368, "lr": 0.0015568031865099863, "epoch": 1.8647790291451884, "percentage": 95.41, "elapsed_time": "1 day, 16:18:38", "remaining_time": "1:56:17", "throughput": 332.96, "total_tokens": 48318944} {"current_steps": 38170, "total_steps": 40000, "loss": 0.0497, "lr": 0.0015483500103486369, "epoch": 1.8650233308088828, "percentage": 95.43, "elapsed_time": "1 day, 16:18:41", "remaining_time": "1:55:57", "throughput": 333.0, "total_tokens": 48325216} {"current_steps": 38175, "total_steps": 40000, "loss": 0.0394, "lr": 0.0015399197272972787, "epoch": 1.8652676324725772, "percentage": 95.44, "elapsed_time": "1 day, 16:18:45", "remaining_time": "1:55:37", "throughput": 333.03, "total_tokens": 48331584} {"current_steps": 38180, "total_steps": 40000, "loss": 0.0459, "lr": 0.0015315123386559714, "epoch": 1.8655119341362716, "percentage": 95.45, "elapsed_time": "1 day, 16:18:47", "remaining_time": "1:55:18", "throughput": 333.07, "total_tokens": 48337632} {"current_steps": 38185, "total_steps": 40000, "loss": 0.073, "lr": 0.0015231278457212283, "epoch": 1.8657562357999657, "percentage": 95.46, "elapsed_time": "1 day, 16:18:51", "remaining_time": "1:54:58", "throughput": 333.11, "total_tokens": 48344160} {"current_steps": 38190, "total_steps": 40000, "loss": 0.0382, "lr": 0.001514766249786048, "epoch": 1.8660005374636601, "percentage": 95.47, "elapsed_time": "1 day, 16:18:54", "remaining_time": "1:54:38", "throughput": 333.14, "total_tokens": 48350304} {"current_steps": 38195, "total_steps": 40000, "loss": 0.0553, "lr": 0.0015064275521398994, "epoch": 1.8662448391273545, "percentage": 95.49, "elapsed_time": "1 day, 16:18:57", "remaining_time": "1:54:18", "throughput": 333.18, "total_tokens": 48356224} {"current_steps": 38200, "total_steps": 40000, "loss": 0.0686, "lr": 0.0014981117540686872, "epoch": 1.8664891407910487, "percentage": 95.5, "elapsed_time": "1 day, 16:19:00", "remaining_time": "1:53:59", "throughput": 333.21, "total_tokens": 48362560} {"current_steps": 38200, "total_steps": 40000, "eval_loss": 0.06052229925990105, "epoch": 1.8664891407910487, "percentage": 95.5, "elapsed_time": "1 day, 16:29:33", "remaining_time": "1:54:28", "throughput": 331.76, "total_tokens": 48362560} {"current_steps": 38205, "total_steps": 40000, "loss": 0.0628, "lr": 0.0014898188568548687, "epoch": 1.866733442454743, "percentage": 95.51, "elapsed_time": "1 day, 16:29:37", "remaining_time": "1:54:09", "throughput": 331.8, "total_tokens": 48368800} {"current_steps": 38210, "total_steps": 40000, "loss": 0.0778, "lr": 0.0014815488617772542, "epoch": 1.8669777441184374, "percentage": 95.53, "elapsed_time": "1 day, 16:29:40", "remaining_time": "1:53:49", "throughput": 331.84, "total_tokens": 48375232} {"current_steps": 38215, "total_steps": 40000, "loss": 0.0594, "lr": 0.0014733017701112072, "epoch": 1.8672220457821318, "percentage": 95.54, "elapsed_time": "1 day, 16:29:44", "remaining_time": "1:53:29", "throughput": 331.87, "total_tokens": 48381920} {"current_steps": 38220, "total_steps": 40000, "loss": 0.0408, "lr": 0.0014650775831285435, "epoch": 1.8674663474458262, "percentage": 95.55, "elapsed_time": "1 day, 16:29:47", "remaining_time": "1:53:09", "throughput": 331.91, "total_tokens": 48388160} {"current_steps": 38225, "total_steps": 40000, "loss": 0.0571, "lr": 0.001456876302097515, "epoch": 1.8677106491095206, "percentage": 95.56, "elapsed_time": "1 day, 16:29:50", "remaining_time": "1:52:49", "throughput": 331.94, "total_tokens": 48394176} {"current_steps": 38230, "total_steps": 40000, "loss": 0.0697, "lr": 0.0014486979282828604, "epoch": 1.8679549507732147, "percentage": 95.58, "elapsed_time": "1 day, 16:29:53", "remaining_time": "1:52:30", "throughput": 331.98, "total_tokens": 48400512} {"current_steps": 38235, "total_steps": 40000, "loss": 0.0517, "lr": 0.001440542462945804, "epoch": 1.868199252436909, "percentage": 95.59, "elapsed_time": "1 day, 16:29:56", "remaining_time": "1:52:10", "throughput": 332.02, "total_tokens": 48406784} {"current_steps": 38240, "total_steps": 40000, "loss": 0.0504, "lr": 0.0014324099073440232, "epoch": 1.8684435541006035, "percentage": 95.6, "elapsed_time": "1 day, 16:29:59", "remaining_time": "1:51:50", "throughput": 332.05, "total_tokens": 48412960} {"current_steps": 38245, "total_steps": 40000, "loss": 0.0755, "lr": 0.0014243002627316482, "epoch": 1.8686878557642976, "percentage": 95.61, "elapsed_time": "1 day, 16:30:02", "remaining_time": "1:51:30", "throughput": 332.09, "total_tokens": 48419488} {"current_steps": 38250, "total_steps": 40000, "loss": 0.0602, "lr": 0.0014162135303592781, "epoch": 1.868932157427992, "percentage": 95.62, "elapsed_time": "1 day, 16:30:05", "remaining_time": "1:51:10", "throughput": 332.13, "total_tokens": 48425664} {"current_steps": 38255, "total_steps": 40000, "loss": 0.0586, "lr": 0.001408149711474016, "epoch": 1.8691764590916864, "percentage": 95.64, "elapsed_time": "1 day, 16:30:08", "remaining_time": "1:50:51", "throughput": 332.16, "total_tokens": 48432416} {"current_steps": 38260, "total_steps": 40000, "loss": 0.0665, "lr": 0.0014001088073193834, "epoch": 1.8694207607553808, "percentage": 95.65, "elapsed_time": "1 day, 16:30:11", "remaining_time": "1:50:31", "throughput": 332.2, "total_tokens": 48438976} {"current_steps": 38265, "total_steps": 40000, "loss": 0.0665, "lr": 0.0013920908191354052, "epoch": 1.8696650624190752, "percentage": 95.66, "elapsed_time": "1 day, 16:30:14", "remaining_time": "1:50:11", "throughput": 332.24, "total_tokens": 48445152} {"current_steps": 38270, "total_steps": 40000, "loss": 0.0507, "lr": 0.001384095748158526, "epoch": 1.8699093640827695, "percentage": 95.67, "elapsed_time": "1 day, 16:30:17", "remaining_time": "1:49:51", "throughput": 332.27, "total_tokens": 48451104} {"current_steps": 38275, "total_steps": 40000, "loss": 0.0648, "lr": 0.0013761235956217255, "epoch": 1.8701536657464637, "percentage": 95.69, "elapsed_time": "1 day, 16:30:20", "remaining_time": "1:49:31", "throughput": 332.31, "total_tokens": 48457184} {"current_steps": 38280, "total_steps": 40000, "loss": 0.0795, "lr": 0.0013681743627543873, "epoch": 1.870397967410158, "percentage": 95.7, "elapsed_time": "1 day, 16:30:23", "remaining_time": "1:49:12", "throughput": 332.34, "total_tokens": 48463232} {"current_steps": 38285, "total_steps": 40000, "loss": 0.0554, "lr": 0.001360248050782381, "epoch": 1.8706422690738524, "percentage": 95.71, "elapsed_time": "1 day, 16:30:26", "remaining_time": "1:48:52", "throughput": 332.37, "total_tokens": 48469088} {"current_steps": 38290, "total_steps": 40000, "loss": 0.0487, "lr": 0.001352344660928062, "epoch": 1.8708865707375466, "percentage": 95.73, "elapsed_time": "1 day, 16:30:29", "remaining_time": "1:48:32", "throughput": 332.41, "total_tokens": 48475648} {"current_steps": 38295, "total_steps": 40000, "loss": 0.0522, "lr": 0.0013444641944102052, "epoch": 1.871130872401241, "percentage": 95.74, "elapsed_time": "1 day, 16:30:32", "remaining_time": "1:48:12", "throughput": 332.45, "total_tokens": 48481504} {"current_steps": 38300, "total_steps": 40000, "loss": 0.0482, "lr": 0.0013366066524441056, "epoch": 1.8713751740649354, "percentage": 95.75, "elapsed_time": "1 day, 16:30:35", "remaining_time": "1:47:53", "throughput": 332.48, "total_tokens": 48487904} {"current_steps": 38305, "total_steps": 40000, "loss": 0.0664, "lr": 0.0013287720362414768, "epoch": 1.8716194757286297, "percentage": 95.76, "elapsed_time": "1 day, 16:30:38", "remaining_time": "1:47:33", "throughput": 332.52, "total_tokens": 48494432} {"current_steps": 38310, "total_steps": 40000, "loss": 0.0634, "lr": 0.0013209603470105025, "epoch": 1.8718637773923241, "percentage": 95.78, "elapsed_time": "1 day, 16:30:41", "remaining_time": "1:47:13", "throughput": 332.56, "total_tokens": 48500832} {"current_steps": 38315, "total_steps": 40000, "loss": 0.0815, "lr": 0.0013131715859558857, "epoch": 1.8721080790560185, "percentage": 95.79, "elapsed_time": "1 day, 16:30:45", "remaining_time": "1:46:53", "throughput": 332.59, "total_tokens": 48507296} {"current_steps": 38320, "total_steps": 40000, "loss": 0.058, "lr": 0.001305405754278699, "epoch": 1.8723523807197127, "percentage": 95.8, "elapsed_time": "1 day, 16:30:48", "remaining_time": "1:46:34", "throughput": 332.63, "total_tokens": 48513408} {"current_steps": 38325, "total_steps": 40000, "loss": 0.0611, "lr": 0.0012976628531765843, "epoch": 1.872596682383407, "percentage": 95.81, "elapsed_time": "1 day, 16:30:51", "remaining_time": "1:46:14", "throughput": 332.66, "total_tokens": 48519392} {"current_steps": 38330, "total_steps": 40000, "loss": 0.0619, "lr": 0.0012899428838435533, "epoch": 1.8728409840471012, "percentage": 95.83, "elapsed_time": "1 day, 16:30:54", "remaining_time": "1:45:54", "throughput": 332.7, "total_tokens": 48525312} {"current_steps": 38335, "total_steps": 40000, "loss": 0.0532, "lr": 0.001282245847470137, "epoch": 1.8730852857107956, "percentage": 95.84, "elapsed_time": "1 day, 16:30:56", "remaining_time": "1:45:34", "throughput": 332.73, "total_tokens": 48531136} {"current_steps": 38340, "total_steps": 40000, "loss": 0.0599, "lr": 0.001274571745243319, "epoch": 1.87332958737449, "percentage": 95.85, "elapsed_time": "1 day, 16:31:00", "remaining_time": "1:45:15", "throughput": 332.77, "total_tokens": 48537312} {"current_steps": 38345, "total_steps": 40000, "loss": 0.0493, "lr": 0.0012669205783465364, "epoch": 1.8735738890381843, "percentage": 95.86, "elapsed_time": "1 day, 16:31:03", "remaining_time": "1:44:55", "throughput": 332.8, "total_tokens": 48543456} {"current_steps": 38350, "total_steps": 40000, "loss": 0.0818, "lr": 0.001259292347959695, "epoch": 1.8738181907018787, "percentage": 95.88, "elapsed_time": "1 day, 16:31:06", "remaining_time": "1:44:35", "throughput": 332.84, "total_tokens": 48549856} {"current_steps": 38355, "total_steps": 40000, "loss": 0.0607, "lr": 0.0012516870552591707, "epoch": 1.874062492365573, "percentage": 95.89, "elapsed_time": "1 day, 16:31:09", "remaining_time": "1:44:16", "throughput": 332.87, "total_tokens": 48556064} {"current_steps": 38360, "total_steps": 40000, "loss": 0.0629, "lr": 0.001244104701417792, "epoch": 1.8743067940292675, "percentage": 95.9, "elapsed_time": "1 day, 16:31:12", "remaining_time": "1:43:56", "throughput": 332.91, "total_tokens": 48562400} {"current_steps": 38365, "total_steps": 40000, "loss": 0.0546, "lr": 0.0012365452876048565, "epoch": 1.8745510956929616, "percentage": 95.91, "elapsed_time": "1 day, 16:31:15", "remaining_time": "1:43:36", "throughput": 332.95, "total_tokens": 48568864} {"current_steps": 38370, "total_steps": 40000, "loss": 0.0513, "lr": 0.001229008814986099, "epoch": 1.874795397356656, "percentage": 95.93, "elapsed_time": "1 day, 16:31:18", "remaining_time": "1:43:17", "throughput": 332.98, "total_tokens": 48575168} {"current_steps": 38375, "total_steps": 40000, "loss": 0.0644, "lr": 0.0012214952847237725, "epoch": 1.8750396990203502, "percentage": 95.94, "elapsed_time": "1 day, 16:31:21", "remaining_time": "1:42:57", "throughput": 333.02, "total_tokens": 48581344} {"current_steps": 38380, "total_steps": 40000, "loss": 0.0754, "lr": 0.0012140046979765339, "epoch": 1.8752840006840445, "percentage": 95.95, "elapsed_time": "1 day, 16:31:24", "remaining_time": "1:42:37", "throughput": 333.05, "total_tokens": 48587456} {"current_steps": 38385, "total_steps": 40000, "loss": 0.0566, "lr": 0.0012065370558995258, "epoch": 1.875528302347739, "percentage": 95.96, "elapsed_time": "1 day, 16:31:27", "remaining_time": "1:42:18", "throughput": 333.09, "total_tokens": 48594208} {"current_steps": 38390, "total_steps": 40000, "loss": 0.0448, "lr": 0.0011990923596443602, "epoch": 1.8757726040114333, "percentage": 95.97, "elapsed_time": "1 day, 16:31:30", "remaining_time": "1:41:58", "throughput": 333.13, "total_tokens": 48600960} {"current_steps": 38395, "total_steps": 40000, "loss": 0.0886, "lr": 0.001191670610359119, "epoch": 1.8760169056751277, "percentage": 95.99, "elapsed_time": "1 day, 16:31:33", "remaining_time": "1:41:38", "throughput": 333.17, "total_tokens": 48607104} {"current_steps": 38400, "total_steps": 40000, "loss": 0.0538, "lr": 0.0011842718091882865, "epoch": 1.876261207338822, "percentage": 96.0, "elapsed_time": "1 day, 16:31:36", "remaining_time": "1:41:19", "throughput": 333.2, "total_tokens": 48613184} {"current_steps": 38400, "total_steps": 40000, "eval_loss": 0.06046809256076813, "epoch": 1.876261207338822, "percentage": 96.0, "elapsed_time": "1 day, 16:42:11", "remaining_time": "1:41:45", "throughput": 331.76, "total_tokens": 48613184} {"current_steps": 38405, "total_steps": 40000, "loss": 0.0823, "lr": 0.0011768959572729, "epoch": 1.8765055090025164, "percentage": 96.01, "elapsed_time": "1 day, 16:42:15", "remaining_time": "1:41:25", "throughput": 331.79, "total_tokens": 48619424} {"current_steps": 38410, "total_steps": 40000, "loss": 0.0571, "lr": 0.001169543055750366, "epoch": 1.8767498106662106, "percentage": 96.03, "elapsed_time": "1 day, 16:42:18", "remaining_time": "1:41:06", "throughput": 331.83, "total_tokens": 48625760} {"current_steps": 38415, "total_steps": 40000, "loss": 0.0674, "lr": 0.0011622131057546115, "epoch": 1.876994112329905, "percentage": 96.04, "elapsed_time": "1 day, 16:42:21", "remaining_time": "1:40:46", "throughput": 331.87, "total_tokens": 48632032} {"current_steps": 38420, "total_steps": 40000, "loss": 0.0844, "lr": 0.0011549061084160316, "epoch": 1.8772384139935991, "percentage": 96.05, "elapsed_time": "1 day, 16:42:24", "remaining_time": "1:40:26", "throughput": 331.9, "total_tokens": 48638176} {"current_steps": 38425, "total_steps": 40000, "loss": 0.0745, "lr": 0.0011476220648614088, "epoch": 1.8774827156572935, "percentage": 96.06, "elapsed_time": "1 day, 16:42:27", "remaining_time": "1:40:06", "throughput": 331.93, "total_tokens": 48644192} {"current_steps": 38430, "total_steps": 40000, "loss": 0.0384, "lr": 0.0011403609762140777, "epoch": 1.877727017320988, "percentage": 96.08, "elapsed_time": "1 day, 16:42:30", "remaining_time": "1:39:47", "throughput": 331.97, "total_tokens": 48650880} {"current_steps": 38435, "total_steps": 40000, "loss": 0.0599, "lr": 0.0011331228435937756, "epoch": 1.8779713189846823, "percentage": 96.09, "elapsed_time": "1 day, 16:42:33", "remaining_time": "1:39:27", "throughput": 332.01, "total_tokens": 48657344} {"current_steps": 38440, "total_steps": 40000, "loss": 0.0424, "lr": 0.0011259076681166935, "epoch": 1.8782156206483767, "percentage": 96.1, "elapsed_time": "1 day, 16:42:36", "remaining_time": "1:39:07", "throughput": 332.04, "total_tokens": 48663392} {"current_steps": 38445, "total_steps": 40000, "loss": 0.0629, "lr": 0.0011187154508955244, "epoch": 1.878459922312071, "percentage": 96.11, "elapsed_time": "1 day, 16:42:39", "remaining_time": "1:38:47", "throughput": 332.08, "total_tokens": 48669728} {"current_steps": 38450, "total_steps": 40000, "loss": 0.0598, "lr": 0.001111546193039381, "epoch": 1.8787042239757654, "percentage": 96.12, "elapsed_time": "1 day, 16:42:42", "remaining_time": "1:38:28", "throughput": 332.12, "total_tokens": 48676224} {"current_steps": 38455, "total_steps": 40000, "loss": 0.0499, "lr": 0.0011043998956538792, "epoch": 1.8789485256394596, "percentage": 96.14, "elapsed_time": "1 day, 16:42:45", "remaining_time": "1:38:08", "throughput": 332.15, "total_tokens": 48682400} {"current_steps": 38460, "total_steps": 40000, "loss": 0.0499, "lr": 0.0010972765598410538, "epoch": 1.879192827303154, "percentage": 96.15, "elapsed_time": "1 day, 16:42:49", "remaining_time": "1:37:48", "throughput": 332.19, "total_tokens": 48688576} {"current_steps": 38465, "total_steps": 40000, "loss": 0.0655, "lr": 0.0010901761866993931, "epoch": 1.8794371289668481, "percentage": 96.16, "elapsed_time": "1 day, 16:42:52", "remaining_time": "1:37:29", "throughput": 332.23, "total_tokens": 48694976} {"current_steps": 38470, "total_steps": 40000, "loss": 0.0339, "lr": 0.0010830987773238876, "epoch": 1.8796814306305425, "percentage": 96.17, "elapsed_time": "1 day, 16:42:55", "remaining_time": "1:37:09", "throughput": 332.26, "total_tokens": 48701696} {"current_steps": 38475, "total_steps": 40000, "loss": 0.0545, "lr": 0.0010760443328059644, "epoch": 1.8799257322942369, "percentage": 96.19, "elapsed_time": "1 day, 16:42:58", "remaining_time": "1:36:49", "throughput": 332.3, "total_tokens": 48707872} {"current_steps": 38480, "total_steps": 40000, "loss": 0.0596, "lr": 0.001069012854233503, "epoch": 1.8801700339579313, "percentage": 96.2, "elapsed_time": "1 day, 16:43:01", "remaining_time": "1:36:30", "throughput": 332.34, "total_tokens": 48714304} {"current_steps": 38485, "total_steps": 40000, "loss": 0.0474, "lr": 0.0010620043426908365, "epoch": 1.8804143356216256, "percentage": 96.21, "elapsed_time": "1 day, 16:43:04", "remaining_time": "1:36:10", "throughput": 332.38, "total_tokens": 48721312} {"current_steps": 38490, "total_steps": 40000, "loss": 0.0545, "lr": 0.0010550187992587833, "epoch": 1.88065863728532, "percentage": 96.23, "elapsed_time": "1 day, 16:43:07", "remaining_time": "1:35:50", "throughput": 332.42, "total_tokens": 48727968} {"current_steps": 38495, "total_steps": 40000, "loss": 0.043, "lr": 0.0010480562250145653, "epoch": 1.8809029389490144, "percentage": 96.24, "elapsed_time": "1 day, 16:43:10", "remaining_time": "1:35:31", "throughput": 332.45, "total_tokens": 48734112} {"current_steps": 38500, "total_steps": 40000, "loss": 0.0525, "lr": 0.0010411166210319567, "epoch": 1.8811472406127085, "percentage": 96.25, "elapsed_time": "1 day, 16:43:13", "remaining_time": "1:35:11", "throughput": 332.49, "total_tokens": 48740512} {"current_steps": 38505, "total_steps": 40000, "loss": 0.0596, "lr": 0.0010341999883810848, "epoch": 1.881391542276403, "percentage": 96.26, "elapsed_time": "1 day, 16:43:16", "remaining_time": "1:34:51", "throughput": 332.52, "total_tokens": 48746720} {"current_steps": 38510, "total_steps": 40000, "loss": 0.066, "lr": 0.0010273063281285965, "epoch": 1.881635843940097, "percentage": 96.28, "elapsed_time": "1 day, 16:43:19", "remaining_time": "1:34:32", "throughput": 332.56, "total_tokens": 48753248} {"current_steps": 38515, "total_steps": 40000, "loss": 0.0672, "lr": 0.0010204356413375747, "epoch": 1.8818801456037915, "percentage": 96.29, "elapsed_time": "1 day, 16:43:23", "remaining_time": "1:34:12", "throughput": 332.59, "total_tokens": 48759360} {"current_steps": 38520, "total_steps": 40000, "loss": 0.0381, "lr": 0.001013587929067572, "epoch": 1.8821244472674858, "percentage": 96.3, "elapsed_time": "1 day, 16:43:25", "remaining_time": "1:33:52", "throughput": 332.63, "total_tokens": 48765248} {"current_steps": 38525, "total_steps": 40000, "loss": 0.0311, "lr": 0.00100676319237461, "epoch": 1.8823687489311802, "percentage": 96.31, "elapsed_time": "1 day, 16:43:29", "remaining_time": "1:33:33", "throughput": 332.66, "total_tokens": 48771552} {"current_steps": 38530, "total_steps": 40000, "loss": 0.0577, "lr": 0.0009999614323110972, "epoch": 1.8826130505948746, "percentage": 96.33, "elapsed_time": "1 day, 16:43:32", "remaining_time": "1:33:13", "throughput": 332.7, "total_tokens": 48778304} {"current_steps": 38535, "total_steps": 40000, "loss": 0.0501, "lr": 0.000993182649926011, "epoch": 1.882857352258569, "percentage": 96.34, "elapsed_time": "1 day, 16:43:35", "remaining_time": "1:32:53", "throughput": 332.74, "total_tokens": 48785088} {"current_steps": 38540, "total_steps": 40000, "loss": 0.0603, "lr": 0.000986426846264682, "epoch": 1.8831016539222634, "percentage": 96.35, "elapsed_time": "1 day, 16:43:38", "remaining_time": "1:32:34", "throughput": 332.78, "total_tokens": 48791328} {"current_steps": 38545, "total_steps": 40000, "loss": 0.0618, "lr": 0.00097969402236896, "epoch": 1.8833459555859575, "percentage": 96.36, "elapsed_time": "1 day, 16:43:41", "remaining_time": "1:32:14", "throughput": 332.82, "total_tokens": 48797984} {"current_steps": 38550, "total_steps": 40000, "loss": 0.0599, "lr": 0.0009729841792771143, "epoch": 1.883590257249652, "percentage": 96.38, "elapsed_time": "1 day, 16:43:44", "remaining_time": "1:31:55", "throughput": 332.85, "total_tokens": 48804256} {"current_steps": 38555, "total_steps": 40000, "loss": 0.0813, "lr": 0.0009662973180239176, "epoch": 1.883834558913346, "percentage": 96.39, "elapsed_time": "1 day, 16:43:47", "remaining_time": "1:31:35", "throughput": 332.89, "total_tokens": 48810400} {"current_steps": 38560, "total_steps": 40000, "loss": 0.0537, "lr": 0.0009596334396405448, "epoch": 1.8840788605770404, "percentage": 96.4, "elapsed_time": "1 day, 16:43:50", "remaining_time": "1:31:15", "throughput": 332.92, "total_tokens": 48816512} {"current_steps": 38565, "total_steps": 40000, "loss": 0.0256, "lr": 0.0009529925451546406, "epoch": 1.8843231622407348, "percentage": 96.41, "elapsed_time": "1 day, 16:43:53", "remaining_time": "1:30:56", "throughput": 332.96, "total_tokens": 48822784} {"current_steps": 38570, "total_steps": 40000, "loss": 0.0556, "lr": 0.0009463746355903357, "epoch": 1.8845674639044292, "percentage": 96.43, "elapsed_time": "1 day, 16:43:56", "remaining_time": "1:30:36", "throughput": 332.99, "total_tokens": 48829152} {"current_steps": 38575, "total_steps": 40000, "loss": 0.0547, "lr": 0.0009397797119681971, "epoch": 1.8848117655681236, "percentage": 96.44, "elapsed_time": "1 day, 16:43:59", "remaining_time": "1:30:17", "throughput": 333.03, "total_tokens": 48835616} {"current_steps": 38580, "total_steps": 40000, "loss": 0.0537, "lr": 0.0009332077753052281, "epoch": 1.885056067231818, "percentage": 96.45, "elapsed_time": "1 day, 16:44:02", "remaining_time": "1:29:57", "throughput": 333.07, "total_tokens": 48842080} {"current_steps": 38585, "total_steps": 40000, "loss": 0.0686, "lr": 0.0009266588266149011, "epoch": 1.8853003688955123, "percentage": 96.46, "elapsed_time": "1 day, 16:44:05", "remaining_time": "1:29:37", "throughput": 333.11, "total_tokens": 48848736} {"current_steps": 38590, "total_steps": 40000, "loss": 0.0831, "lr": 0.0009201328669071584, "epoch": 1.8855446705592065, "percentage": 96.47, "elapsed_time": "1 day, 16:44:09", "remaining_time": "1:29:18", "throughput": 333.14, "total_tokens": 48855040} {"current_steps": 38595, "total_steps": 40000, "loss": 0.0513, "lr": 0.0009136298971883949, "epoch": 1.8857889722229009, "percentage": 96.49, "elapsed_time": "1 day, 16:44:12", "remaining_time": "1:28:58", "throughput": 333.18, "total_tokens": 48861440} {"current_steps": 38600, "total_steps": 40000, "loss": 0.0769, "lr": 0.0009071499184614251, "epoch": 1.886033273886595, "percentage": 96.5, "elapsed_time": "1 day, 16:44:15", "remaining_time": "1:28:39", "throughput": 333.22, "total_tokens": 48868096} {"current_steps": 38600, "total_steps": 40000, "eval_loss": 0.06045933812856674, "epoch": 1.886033273886595, "percentage": 96.5, "elapsed_time": "1 day, 16:54:52", "remaining_time": "1:29:02", "throughput": 331.78, "total_tokens": 48868096} {"current_steps": 38605, "total_steps": 40000, "loss": 0.0391, "lr": 0.0009006929317255663, "epoch": 1.8862775755502894, "percentage": 96.51, "elapsed_time": "1 day, 16:54:56", "remaining_time": "1:28:42", "throughput": 331.81, "total_tokens": 48874304} {"current_steps": 38610, "total_steps": 40000, "loss": 0.0426, "lr": 0.0008942589379765387, "epoch": 1.8865218772139838, "percentage": 96.53, "elapsed_time": "1 day, 16:54:59", "remaining_time": "1:28:22", "throughput": 331.84, "total_tokens": 48880352} {"current_steps": 38615, "total_steps": 40000, "loss": 0.0284, "lr": 0.0008878479382065817, "epoch": 1.8867661788776782, "percentage": 96.54, "elapsed_time": "1 day, 16:55:02", "remaining_time": "1:28:03", "throughput": 331.88, "total_tokens": 48886816} {"current_steps": 38620, "total_steps": 40000, "loss": 0.0479, "lr": 0.0008814599334043215, "epoch": 1.8870104805413725, "percentage": 96.55, "elapsed_time": "1 day, 16:55:05", "remaining_time": "1:27:43", "throughput": 331.92, "total_tokens": 48892896} {"current_steps": 38625, "total_steps": 40000, "loss": 0.0492, "lr": 0.0008750949245548866, "epoch": 1.887254782205067, "percentage": 96.56, "elapsed_time": "1 day, 16:55:08", "remaining_time": "1:27:23", "throughput": 331.95, "total_tokens": 48898848} {"current_steps": 38630, "total_steps": 40000, "loss": 0.0896, "lr": 0.0008687529126398252, "epoch": 1.8874990838687613, "percentage": 96.58, "elapsed_time": "1 day, 16:55:11", "remaining_time": "1:27:04", "throughput": 331.98, "total_tokens": 48904928} {"current_steps": 38635, "total_steps": 40000, "loss": 0.0514, "lr": 0.0008624338986371715, "epoch": 1.8877433855324555, "percentage": 96.59, "elapsed_time": "1 day, 16:55:14", "remaining_time": "1:26:44", "throughput": 332.02, "total_tokens": 48911136} {"current_steps": 38640, "total_steps": 40000, "loss": 0.0624, "lr": 0.0008561378835213962, "epoch": 1.8879876871961498, "percentage": 96.6, "elapsed_time": "1 day, 16:55:17", "remaining_time": "1:26:25", "throughput": 332.06, "total_tokens": 48917600} {"current_steps": 38645, "total_steps": 40000, "loss": 0.0625, "lr": 0.0008498648682634058, "epoch": 1.888231988859844, "percentage": 96.61, "elapsed_time": "1 day, 16:55:20", "remaining_time": "1:26:05", "throughput": 332.09, "total_tokens": 48924256} {"current_steps": 38650, "total_steps": 40000, "loss": 0.0468, "lr": 0.0008436148538306099, "epoch": 1.8884762905235384, "percentage": 96.62, "elapsed_time": "1 day, 16:55:24", "remaining_time": "1:25:45", "throughput": 332.13, "total_tokens": 48931360} {"current_steps": 38655, "total_steps": 40000, "loss": 0.0732, "lr": 0.0008373878411868041, "epoch": 1.8887205921872328, "percentage": 96.64, "elapsed_time": "1 day, 16:55:27", "remaining_time": "1:25:26", "throughput": 332.17, "total_tokens": 48937856} {"current_steps": 38660, "total_steps": 40000, "loss": 0.0628, "lr": 0.000831183831292287, "epoch": 1.8889648938509271, "percentage": 96.65, "elapsed_time": "1 day, 16:55:30", "remaining_time": "1:25:06", "throughput": 332.21, "total_tokens": 48944256} {"current_steps": 38665, "total_steps": 40000, "loss": 0.05, "lr": 0.0008250028251037933, "epoch": 1.8892091955146215, "percentage": 96.66, "elapsed_time": "1 day, 16:55:33", "remaining_time": "1:24:47", "throughput": 332.24, "total_tokens": 48950560} {"current_steps": 38670, "total_steps": 40000, "loss": 0.0795, "lr": 0.0008188448235745271, "epoch": 1.889453497178316, "percentage": 96.67, "elapsed_time": "1 day, 16:55:36", "remaining_time": "1:24:27", "throughput": 332.28, "total_tokens": 48956448} {"current_steps": 38675, "total_steps": 40000, "loss": 0.053, "lr": 0.0008127098276541122, "epoch": 1.8896977988420103, "percentage": 96.69, "elapsed_time": "1 day, 16:55:39", "remaining_time": "1:24:07", "throughput": 332.31, "total_tokens": 48962944} {"current_steps": 38680, "total_steps": 40000, "loss": 0.0714, "lr": 0.0008065978382886418, "epoch": 1.8899421005057044, "percentage": 96.7, "elapsed_time": "1 day, 16:55:42", "remaining_time": "1:23:48", "throughput": 332.35, "total_tokens": 48969184} {"current_steps": 38685, "total_steps": 40000, "loss": 0.0873, "lr": 0.0008005088564206785, "epoch": 1.8901864021693988, "percentage": 96.71, "elapsed_time": "1 day, 16:55:45", "remaining_time": "1:23:28", "throughput": 332.38, "total_tokens": 48974816} {"current_steps": 38690, "total_steps": 40000, "loss": 0.0297, "lr": 0.0007944428829891881, "epoch": 1.890430703833093, "percentage": 96.73, "elapsed_time": "1 day, 16:55:48", "remaining_time": "1:23:09", "throughput": 332.43, "total_tokens": 48982464} {"current_steps": 38695, "total_steps": 40000, "loss": 0.0343, "lr": 0.0007883999189296386, "epoch": 1.8906750054967874, "percentage": 96.74, "elapsed_time": "1 day, 16:55:51", "remaining_time": "1:22:49", "throughput": 332.46, "total_tokens": 48989024} {"current_steps": 38700, "total_steps": 40000, "loss": 0.0701, "lr": 0.0007823799651739515, "epoch": 1.8909193071604817, "percentage": 96.75, "elapsed_time": "1 day, 16:55:54", "remaining_time": "1:22:29", "throughput": 332.5, "total_tokens": 48995584} {"current_steps": 38705, "total_steps": 40000, "loss": 0.058, "lr": 0.0007763830226504509, "epoch": 1.8911636088241761, "percentage": 96.76, "elapsed_time": "1 day, 16:55:57", "remaining_time": "1:22:10", "throughput": 332.54, "total_tokens": 49002048} {"current_steps": 38710, "total_steps": 40000, "loss": 0.0856, "lr": 0.0007704090922839468, "epoch": 1.8914079104878705, "percentage": 96.78, "elapsed_time": "1 day, 16:56:01", "remaining_time": "1:21:50", "throughput": 332.57, "total_tokens": 49008256} {"current_steps": 38715, "total_steps": 40000, "loss": 0.0279, "lr": 0.0007644581749957025, "epoch": 1.8916522121515649, "percentage": 96.79, "elapsed_time": "1 day, 16:56:04", "remaining_time": "1:21:31", "throughput": 332.61, "total_tokens": 49014688} {"current_steps": 38720, "total_steps": 40000, "loss": 0.04, "lr": 0.000758530271703417, "epoch": 1.891896513815259, "percentage": 96.8, "elapsed_time": "1 day, 16:56:07", "remaining_time": "1:21:11", "throughput": 332.65, "total_tokens": 49021184} {"current_steps": 38725, "total_steps": 40000, "loss": 0.0416, "lr": 0.0007526253833212426, "epoch": 1.8921408154789534, "percentage": 96.81, "elapsed_time": "1 day, 16:56:10", "remaining_time": "1:20:52", "throughput": 332.68, "total_tokens": 49027840} {"current_steps": 38730, "total_steps": 40000, "loss": 0.0547, "lr": 0.0007467435107598008, "epoch": 1.8923851171426478, "percentage": 96.83, "elapsed_time": "1 day, 16:56:13", "remaining_time": "1:20:32", "throughput": 332.72, "total_tokens": 49034432} {"current_steps": 38735, "total_steps": 40000, "loss": 0.0318, "lr": 0.0007408846549261328, "epoch": 1.892629418806342, "percentage": 96.84, "elapsed_time": "1 day, 16:56:16", "remaining_time": "1:20:13", "throughput": 332.76, "total_tokens": 49040864} {"current_steps": 38740, "total_steps": 40000, "loss": 0.041, "lr": 0.0007350488167237656, "epoch": 1.8928737204700363, "percentage": 96.85, "elapsed_time": "1 day, 16:56:19", "remaining_time": "1:19:53", "throughput": 332.8, "total_tokens": 49047424} {"current_steps": 38745, "total_steps": 40000, "loss": 0.035, "lr": 0.0007292359970526629, "epoch": 1.8931180221337307, "percentage": 96.86, "elapsed_time": "1 day, 16:56:22", "remaining_time": "1:19:33", "throughput": 332.83, "total_tokens": 49053600} {"current_steps": 38750, "total_steps": 40000, "loss": 0.0643, "lr": 0.0007234461968092076, "epoch": 1.893362323797425, "percentage": 96.88, "elapsed_time": "1 day, 16:56:26", "remaining_time": "1:19:14", "throughput": 332.87, "total_tokens": 49060032} {"current_steps": 38755, "total_steps": 40000, "loss": 0.0653, "lr": 0.0007176794168862854, "epoch": 1.8936066254611195, "percentage": 96.89, "elapsed_time": "1 day, 16:56:29", "remaining_time": "1:18:54", "throughput": 332.91, "total_tokens": 49066624} {"current_steps": 38760, "total_steps": 40000, "loss": 0.0547, "lr": 0.000711935658173185, "epoch": 1.8938509271248138, "percentage": 96.9, "elapsed_time": "1 day, 16:56:32", "remaining_time": "1:18:35", "throughput": 332.94, "total_tokens": 49073376} {"current_steps": 38765, "total_steps": 40000, "loss": 0.054, "lr": 0.0007062149215556812, "epoch": 1.894095228788508, "percentage": 96.91, "elapsed_time": "1 day, 16:56:35", "remaining_time": "1:18:15", "throughput": 332.98, "total_tokens": 49079616} {"current_steps": 38770, "total_steps": 40000, "loss": 0.0461, "lr": 0.0007005172079159849, "epoch": 1.8943395304522024, "percentage": 96.92, "elapsed_time": "1 day, 16:56:38", "remaining_time": "1:17:56", "throughput": 333.02, "total_tokens": 49086528} {"current_steps": 38775, "total_steps": 40000, "loss": 0.0464, "lr": 0.0006948425181327267, "epoch": 1.8945838321158968, "percentage": 96.94, "elapsed_time": "1 day, 16:56:41", "remaining_time": "1:17:36", "throughput": 333.06, "total_tokens": 49093152} {"current_steps": 38780, "total_steps": 40000, "loss": 0.0359, "lr": 0.000689190853081073, "epoch": 1.894828133779591, "percentage": 96.95, "elapsed_time": "1 day, 16:56:44", "remaining_time": "1:17:17", "throughput": 333.09, "total_tokens": 49099520} {"current_steps": 38785, "total_steps": 40000, "loss": 0.0496, "lr": 0.000683562213632527, "epoch": 1.8950724354432853, "percentage": 96.96, "elapsed_time": "1 day, 16:56:47", "remaining_time": "1:16:57", "throughput": 333.13, "total_tokens": 49105792} {"current_steps": 38790, "total_steps": 40000, "loss": 0.0512, "lr": 0.0006779566006551108, "epoch": 1.8953167371069797, "percentage": 96.97, "elapsed_time": "1 day, 16:56:50", "remaining_time": "1:16:38", "throughput": 333.17, "total_tokens": 49112352} {"current_steps": 38795, "total_steps": 40000, "loss": 0.0498, "lr": 0.0006723740150132995, "epoch": 1.895561038770674, "percentage": 96.99, "elapsed_time": "1 day, 16:56:53", "remaining_time": "1:16:18", "throughput": 333.2, "total_tokens": 49118848} {"current_steps": 38800, "total_steps": 40000, "loss": 0.0386, "lr": 0.0006668144575679713, "epoch": 1.8958053404343684, "percentage": 97.0, "elapsed_time": "1 day, 16:56:57", "remaining_time": "1:15:59", "throughput": 333.24, "total_tokens": 49125344} {"current_steps": 38800, "total_steps": 40000, "eval_loss": 0.06046942248940468, "epoch": 1.8958053404343684, "percentage": 97.0, "elapsed_time": "1 day, 17:07:34", "remaining_time": "1:16:18", "throughput": 331.81, "total_tokens": 49125344} {"current_steps": 38805, "total_steps": 40000, "loss": 0.0486, "lr": 0.0006612779291765069, "epoch": 1.8960496420980628, "percentage": 97.01, "elapsed_time": "1 day, 17:07:38", "remaining_time": "1:15:59", "throughput": 331.84, "total_tokens": 49131936} {"current_steps": 38810, "total_steps": 40000, "loss": 0.0635, "lr": 0.0006557644306926736, "epoch": 1.896293943761757, "percentage": 97.02, "elapsed_time": "1 day, 17:07:41", "remaining_time": "1:15:39", "throughput": 331.88, "total_tokens": 49138176} {"current_steps": 38815, "total_steps": 40000, "loss": 0.0551, "lr": 0.0006502739629667575, "epoch": 1.8965382454254514, "percentage": 97.04, "elapsed_time": "1 day, 17:07:44", "remaining_time": "1:15:20", "throughput": 331.91, "total_tokens": 49144448} {"current_steps": 38820, "total_steps": 40000, "loss": 0.0604, "lr": 0.0006448065268454317, "epoch": 1.8967825470891457, "percentage": 97.05, "elapsed_time": "1 day, 17:07:47", "remaining_time": "1:15:00", "throughput": 331.95, "total_tokens": 49150816} {"current_steps": 38825, "total_steps": 40000, "loss": 0.0703, "lr": 0.0006393621231718549, "epoch": 1.89702684875284, "percentage": 97.06, "elapsed_time": "1 day, 17:07:50", "remaining_time": "1:14:41", "throughput": 331.99, "total_tokens": 49157120} {"current_steps": 38830, "total_steps": 40000, "loss": 0.0526, "lr": 0.0006339407527856389, "epoch": 1.8972711504165343, "percentage": 97.08, "elapsed_time": "1 day, 17:07:53", "remaining_time": "1:14:21", "throughput": 332.02, "total_tokens": 49163360} {"current_steps": 38835, "total_steps": 40000, "loss": 0.03, "lr": 0.0006285424165227982, "epoch": 1.8975154520802286, "percentage": 97.09, "elapsed_time": "1 day, 17:07:56", "remaining_time": "1:14:02", "throughput": 332.06, "total_tokens": 49170112} {"current_steps": 38840, "total_steps": 40000, "loss": 0.0534, "lr": 0.0006231671152158169, "epoch": 1.897759753743923, "percentage": 97.1, "elapsed_time": "1 day, 17:07:59", "remaining_time": "1:13:42", "throughput": 332.1, "total_tokens": 49177280} {"current_steps": 38845, "total_steps": 40000, "loss": 0.0617, "lr": 0.0006178148496936819, "epoch": 1.8980040554076174, "percentage": 97.11, "elapsed_time": "1 day, 17:08:02", "remaining_time": "1:13:23", "throughput": 332.13, "total_tokens": 49183040} {"current_steps": 38850, "total_steps": 40000, "loss": 0.0403, "lr": 0.000612485620781733, "epoch": 1.8982483570713118, "percentage": 97.12, "elapsed_time": "1 day, 17:08:05", "remaining_time": "1:13:03", "throughput": 332.16, "total_tokens": 49188864} {"current_steps": 38855, "total_steps": 40000, "loss": 0.078, "lr": 0.0006071794293018296, "epoch": 1.898492658735006, "percentage": 97.14, "elapsed_time": "1 day, 17:08:08", "remaining_time": "1:12:43", "throughput": 332.2, "total_tokens": 49195552} {"current_steps": 38860, "total_steps": 40000, "loss": 0.0624, "lr": 0.0006018962760722501, "epoch": 1.8987369603987003, "percentage": 97.15, "elapsed_time": "1 day, 17:08:11", "remaining_time": "1:12:24", "throughput": 332.24, "total_tokens": 49201600} {"current_steps": 38865, "total_steps": 40000, "loss": 0.0604, "lr": 0.0005966361619077098, "epoch": 1.8989812620623945, "percentage": 97.16, "elapsed_time": "1 day, 17:08:14", "remaining_time": "1:12:04", "throughput": 332.27, "total_tokens": 49208128} {"current_steps": 38870, "total_steps": 40000, "loss": 0.051, "lr": 0.000591399087619393, "epoch": 1.8992255637260889, "percentage": 97.17, "elapsed_time": "1 day, 17:08:18", "remaining_time": "1:11:45", "throughput": 332.31, "total_tokens": 49214912} {"current_steps": 38875, "total_steps": 40000, "loss": 0.0713, "lr": 0.0005861850540149371, "epoch": 1.8994698653897832, "percentage": 97.19, "elapsed_time": "1 day, 17:08:21", "remaining_time": "1:11:25", "throughput": 332.35, "total_tokens": 49220896} {"current_steps": 38880, "total_steps": 40000, "loss": 0.0685, "lr": 0.0005809940618983822, "epoch": 1.8997141670534776, "percentage": 97.2, "elapsed_time": "1 day, 17:08:24", "remaining_time": "1:11:06", "throughput": 332.38, "total_tokens": 49227168} {"current_steps": 38885, "total_steps": 40000, "loss": 0.0602, "lr": 0.0005758261120702712, "epoch": 1.899958468717172, "percentage": 97.21, "elapsed_time": "1 day, 17:08:27", "remaining_time": "1:10:46", "throughput": 332.42, "total_tokens": 49234048} {"current_steps": 38890, "total_steps": 40000, "loss": 0.0384, "lr": 0.0005706812053275501, "epoch": 1.9002027703808664, "percentage": 97.22, "elapsed_time": "1 day, 17:08:30", "remaining_time": "1:10:27", "throughput": 332.46, "total_tokens": 49240352} {"current_steps": 38895, "total_steps": 40000, "loss": 0.0417, "lr": 0.0005655593424636173, "epoch": 1.9004470720445608, "percentage": 97.24, "elapsed_time": "1 day, 17:08:33", "remaining_time": "1:10:07", "throughput": 332.49, "total_tokens": 49246944} {"current_steps": 38900, "total_steps": 40000, "loss": 0.0809, "lr": 0.0005604605242683746, "epoch": 1.900691373708255, "percentage": 97.25, "elapsed_time": "1 day, 17:08:36", "remaining_time": "1:09:48", "throughput": 332.53, "total_tokens": 49253664} {"current_steps": 38905, "total_steps": 40000, "loss": 0.0497, "lr": 0.0005553847515280596, "epoch": 1.9009356753719493, "percentage": 97.26, "elapsed_time": "1 day, 17:08:39", "remaining_time": "1:09:28", "throughput": 332.57, "total_tokens": 49260192} {"current_steps": 38910, "total_steps": 40000, "loss": 0.0444, "lr": 0.0005503320250254795, "epoch": 1.9011799770356435, "percentage": 97.28, "elapsed_time": "1 day, 17:08:42", "remaining_time": "1:09:09", "throughput": 332.6, "total_tokens": 49266240} {"current_steps": 38915, "total_steps": 40000, "loss": 0.0547, "lr": 0.0005453023455397943, "epoch": 1.9014242786993378, "percentage": 97.29, "elapsed_time": "1 day, 17:08:45", "remaining_time": "1:08:49", "throughput": 332.64, "total_tokens": 49272832} {"current_steps": 38920, "total_steps": 40000, "loss": 0.0306, "lr": 0.0005402957138466502, "epoch": 1.9016685803630322, "percentage": 97.3, "elapsed_time": "1 day, 17:08:48", "remaining_time": "1:08:30", "throughput": 332.68, "total_tokens": 49279328} {"current_steps": 38925, "total_steps": 40000, "loss": 0.0478, "lr": 0.0005353121307181463, "epoch": 1.9019128820267266, "percentage": 97.31, "elapsed_time": "1 day, 17:08:52", "remaining_time": "1:08:10", "throughput": 332.72, "total_tokens": 49285952} {"current_steps": 38930, "total_steps": 40000, "loss": 0.0442, "lr": 0.0005303515969227845, "epoch": 1.902157183690421, "percentage": 97.32, "elapsed_time": "1 day, 17:08:55", "remaining_time": "1:07:51", "throughput": 332.75, "total_tokens": 49292000} {"current_steps": 38935, "total_steps": 40000, "loss": 0.0631, "lr": 0.0005254141132255862, "epoch": 1.9024014853541154, "percentage": 97.34, "elapsed_time": "1 day, 17:08:58", "remaining_time": "1:07:32", "throughput": 332.79, "total_tokens": 49298432} {"current_steps": 38940, "total_steps": 40000, "loss": 0.0456, "lr": 0.0005204996803879258, "epoch": 1.9026457870178097, "percentage": 97.35, "elapsed_time": "1 day, 17:09:01", "remaining_time": "1:07:12", "throughput": 332.82, "total_tokens": 49304672} {"current_steps": 38945, "total_steps": 40000, "loss": 0.0542, "lr": 0.0005156082991676969, "epoch": 1.9028900886815039, "percentage": 97.36, "elapsed_time": "1 day, 17:09:04", "remaining_time": "1:06:53", "throughput": 332.86, "total_tokens": 49310848} {"current_steps": 38950, "total_steps": 40000, "loss": 0.0452, "lr": 0.0005107399703192127, "epoch": 1.9031343903451983, "percentage": 97.38, "elapsed_time": "1 day, 17:09:07", "remaining_time": "1:06:33", "throughput": 332.89, "total_tokens": 49317216} {"current_steps": 38955, "total_steps": 40000, "loss": 0.0743, "lr": 0.0005058946945932063, "epoch": 1.9033786920088924, "percentage": 97.39, "elapsed_time": "1 day, 17:09:10", "remaining_time": "1:06:14", "throughput": 332.93, "total_tokens": 49323872} {"current_steps": 38960, "total_steps": 40000, "loss": 0.0522, "lr": 0.0005010724727369131, "epoch": 1.9036229936725868, "percentage": 97.4, "elapsed_time": "1 day, 17:09:13", "remaining_time": "1:05:54", "throughput": 332.96, "total_tokens": 49329952} {"current_steps": 38965, "total_steps": 40000, "loss": 0.0469, "lr": 0.000496273305493955, "epoch": 1.9038672953362812, "percentage": 97.41, "elapsed_time": "1 day, 17:09:16", "remaining_time": "1:05:35", "throughput": 333.0, "total_tokens": 49336288} {"current_steps": 38970, "total_steps": 40000, "loss": 0.0573, "lr": 0.0004914971936044399, "epoch": 1.9041115969999756, "percentage": 97.42, "elapsed_time": "1 day, 17:09:19", "remaining_time": "1:05:15", "throughput": 333.03, "total_tokens": 49342144} {"current_steps": 38975, "total_steps": 40000, "loss": 0.0481, "lr": 0.00048674413780491196, "epoch": 1.90435589866367, "percentage": 97.44, "elapsed_time": "1 day, 17:09:22", "remaining_time": "1:04:56", "throughput": 333.07, "total_tokens": 49348480} {"current_steps": 38980, "total_steps": 40000, "loss": 0.0656, "lr": 0.0004820141388283183, "epoch": 1.9046002003273643, "percentage": 97.45, "elapsed_time": "1 day, 17:09:25", "remaining_time": "1:04:37", "throughput": 333.11, "total_tokens": 49354912} {"current_steps": 38985, "total_steps": 40000, "loss": 0.0592, "lr": 0.00047730719740410874, "epoch": 1.9048445019910587, "percentage": 97.46, "elapsed_time": "1 day, 17:09:28", "remaining_time": "1:04:17", "throughput": 333.14, "total_tokens": 49361152} {"current_steps": 38990, "total_steps": 40000, "loss": 0.0473, "lr": 0.00047262331425816927, "epoch": 1.9050888036547529, "percentage": 97.47, "elapsed_time": "1 day, 17:09:31", "remaining_time": "1:03:58", "throughput": 333.18, "total_tokens": 49367328} {"current_steps": 38995, "total_steps": 40000, "loss": 0.0759, "lr": 0.00046796249011277213, "epoch": 1.9053331053184472, "percentage": 97.49, "elapsed_time": "1 day, 17:09:35", "remaining_time": "1:03:38", "throughput": 333.21, "total_tokens": 49373760} {"current_steps": 39000, "total_steps": 40000, "loss": 0.0539, "lr": 0.00046332472568669236, "epoch": 1.9055774069821414, "percentage": 97.5, "elapsed_time": "1 day, 17:09:38", "remaining_time": "1:03:19", "throughput": 333.25, "total_tokens": 49380224} {"current_steps": 39000, "total_steps": 40000, "eval_loss": 0.06053614616394043, "epoch": 1.9055774069821414, "percentage": 97.5, "elapsed_time": "1 day, 17:20:16", "remaining_time": "1:03:35", "throughput": 331.82, "total_tokens": 49380224} {"current_steps": 39005, "total_steps": 40000, "loss": 0.0534, "lr": 0.0004587100216951578, "epoch": 1.9058217086458358, "percentage": 97.51, "elapsed_time": "1 day, 17:20:20", "remaining_time": "1:03:16", "throughput": 331.85, "total_tokens": 49386816} {"current_steps": 39010, "total_steps": 40000, "loss": 0.0865, "lr": 0.00045411837884978265, "epoch": 1.9060660103095302, "percentage": 97.52, "elapsed_time": "1 day, 17:20:23", "remaining_time": "1:02:56", "throughput": 331.89, "total_tokens": 49393312} {"current_steps": 39015, "total_steps": 40000, "loss": 0.0402, "lr": 0.00044954979785865045, "epoch": 1.9063103119732245, "percentage": 97.54, "elapsed_time": "1 day, 17:20:26", "remaining_time": "1:02:37", "throughput": 331.93, "total_tokens": 49399520} {"current_steps": 39020, "total_steps": 40000, "loss": 0.1003, "lr": 0.00044500427942631426, "epoch": 1.906554613636919, "percentage": 97.55, "elapsed_time": "1 day, 17:20:29", "remaining_time": "1:02:17", "throughput": 331.96, "total_tokens": 49405696} {"current_steps": 39025, "total_steps": 40000, "loss": 0.027, "lr": 0.0004404818242537467, "epoch": 1.9067989153006133, "percentage": 97.56, "elapsed_time": "1 day, 17:20:33", "remaining_time": "1:01:58", "throughput": 332.0, "total_tokens": 49412192} {"current_steps": 39030, "total_steps": 40000, "loss": 0.079, "lr": 0.00043598243303837324, "epoch": 1.9070432169643077, "percentage": 97.58, "elapsed_time": "1 day, 17:20:36", "remaining_time": "1:01:38", "throughput": 332.03, "total_tokens": 49418208} {"current_steps": 39035, "total_steps": 40000, "loss": 0.0523, "lr": 0.00043150610647403885, "epoch": 1.9072875186280018, "percentage": 97.59, "elapsed_time": "1 day, 17:20:39", "remaining_time": "1:01:19", "throughput": 332.07, "total_tokens": 49424864} {"current_steps": 39040, "total_steps": 40000, "loss": 0.0273, "lr": 0.00042705284525104134, "epoch": 1.9075318202916962, "percentage": 97.6, "elapsed_time": "1 day, 17:20:42", "remaining_time": "1:01:00", "throughput": 332.11, "total_tokens": 49431360} {"current_steps": 39045, "total_steps": 40000, "loss": 0.0504, "lr": 0.0004226226500561647, "epoch": 1.9077761219553904, "percentage": 97.61, "elapsed_time": "1 day, 17:20:45", "remaining_time": "1:00:40", "throughput": 332.14, "total_tokens": 49437408} {"current_steps": 39050, "total_steps": 40000, "loss": 0.0636, "lr": 0.0004182155215725791, "epoch": 1.9080204236190847, "percentage": 97.62, "elapsed_time": "1 day, 17:20:48", "remaining_time": "1:00:21", "throughput": 332.17, "total_tokens": 49443648} {"current_steps": 39055, "total_steps": 40000, "loss": 0.0643, "lr": 0.00041383146047992424, "epoch": 1.9082647252827791, "percentage": 97.64, "elapsed_time": "1 day, 17:20:51", "remaining_time": "1:00:01", "throughput": 332.21, "total_tokens": 49449568} {"current_steps": 39060, "total_steps": 40000, "loss": 0.0438, "lr": 0.00040947046745427597, "epoch": 1.9085090269464735, "percentage": 97.65, "elapsed_time": "1 day, 17:20:54", "remaining_time": "0:59:42", "throughput": 332.24, "total_tokens": 49455936} {"current_steps": 39065, "total_steps": 40000, "loss": 0.0748, "lr": 0.00040513254316814625, "epoch": 1.9087533286101679, "percentage": 97.66, "elapsed_time": "1 day, 17:20:57", "remaining_time": "0:59:22", "throughput": 332.28, "total_tokens": 49462560} {"current_steps": 39070, "total_steps": 40000, "loss": 0.0362, "lr": 0.0004008176882905168, "epoch": 1.9089976302738623, "percentage": 97.67, "elapsed_time": "1 day, 17:21:00", "remaining_time": "0:59:03", "throughput": 332.31, "total_tokens": 49468512} {"current_steps": 39075, "total_steps": 40000, "loss": 0.0684, "lr": 0.00039652590348677184, "epoch": 1.9092419319375566, "percentage": 97.69, "elapsed_time": "1 day, 17:21:03", "remaining_time": "0:58:43", "throughput": 332.35, "total_tokens": 49474560} {"current_steps": 39080, "total_steps": 40000, "loss": 0.0579, "lr": 0.00039225718941878206, "epoch": 1.9094862336012508, "percentage": 97.7, "elapsed_time": "1 day, 17:21:06", "remaining_time": "0:58:24", "throughput": 332.38, "total_tokens": 49480896} {"current_steps": 39085, "total_steps": 40000, "loss": 0.0737, "lr": 0.00038801154674480417, "epoch": 1.9097305352649452, "percentage": 97.71, "elapsed_time": "1 day, 17:21:09", "remaining_time": "0:58:05", "throughput": 332.42, "total_tokens": 49487616} {"current_steps": 39090, "total_steps": 40000, "loss": 0.068, "lr": 0.00038378897611959784, "epoch": 1.9099748369286393, "percentage": 97.72, "elapsed_time": "1 day, 17:21:12", "remaining_time": "0:57:45", "throughput": 332.46, "total_tokens": 49493824} {"current_steps": 39095, "total_steps": 40000, "loss": 0.0611, "lr": 0.00037958947819430875, "epoch": 1.9102191385923337, "percentage": 97.74, "elapsed_time": "1 day, 17:21:16", "remaining_time": "0:57:26", "throughput": 332.5, "total_tokens": 49500736} {"current_steps": 39100, "total_steps": 40000, "loss": 0.0574, "lr": 0.0003754130536165856, "epoch": 1.910463440256028, "percentage": 97.75, "elapsed_time": "1 day, 17:21:19", "remaining_time": "0:57:06", "throughput": 332.53, "total_tokens": 49507264} {"current_steps": 39105, "total_steps": 40000, "loss": 0.0544, "lr": 0.0003712597030304632, "epoch": 1.9107077419197225, "percentage": 97.76, "elapsed_time": "1 day, 17:21:22", "remaining_time": "0:56:47", "throughput": 332.57, "total_tokens": 49513824} {"current_steps": 39110, "total_steps": 40000, "loss": 0.0336, "lr": 0.00036712942707646247, "epoch": 1.9109520435834169, "percentage": 97.78, "elapsed_time": "1 day, 17:21:25", "remaining_time": "0:56:28", "throughput": 332.61, "total_tokens": 49520640} {"current_steps": 39115, "total_steps": 40000, "loss": 0.0749, "lr": 0.00036302222639149063, "epoch": 1.9111963452471112, "percentage": 97.79, "elapsed_time": "1 day, 17:21:28", "remaining_time": "0:56:08", "throughput": 332.64, "total_tokens": 49526944} {"current_steps": 39120, "total_steps": 40000, "loss": 0.0461, "lr": 0.000358938101608941, "epoch": 1.9114406469108056, "percentage": 97.8, "elapsed_time": "1 day, 17:21:31", "remaining_time": "0:55:49", "throughput": 332.68, "total_tokens": 49532864} {"current_steps": 39125, "total_steps": 40000, "loss": 0.0823, "lr": 0.0003548770533586598, "epoch": 1.9116849485744998, "percentage": 97.81, "elapsed_time": "1 day, 17:21:34", "remaining_time": "0:55:29", "throughput": 332.71, "total_tokens": 49539264} {"current_steps": 39130, "total_steps": 40000, "loss": 0.0757, "lr": 0.0003508390822668961, "epoch": 1.9119292502381942, "percentage": 97.82, "elapsed_time": "1 day, 17:21:37", "remaining_time": "0:55:10", "throughput": 332.75, "total_tokens": 49545472} {"current_steps": 39135, "total_steps": 40000, "loss": 0.0433, "lr": 0.00034682418895633503, "epoch": 1.9121735519018883, "percentage": 97.84, "elapsed_time": "1 day, 17:21:40", "remaining_time": "0:54:51", "throughput": 332.78, "total_tokens": 49551936} {"current_steps": 39140, "total_steps": 40000, "loss": 0.0452, "lr": 0.0003428323740461647, "epoch": 1.9124178535655827, "percentage": 97.85, "elapsed_time": "1 day, 17:21:43", "remaining_time": "0:54:31", "throughput": 332.82, "total_tokens": 49558528} {"current_steps": 39145, "total_steps": 40000, "loss": 0.0792, "lr": 0.00033886363815194276, "epoch": 1.912662155229277, "percentage": 97.86, "elapsed_time": "1 day, 17:21:46", "remaining_time": "0:54:12", "throughput": 332.85, "total_tokens": 49564384} {"current_steps": 39150, "total_steps": 40000, "loss": 0.0669, "lr": 0.0003349179818857129, "epoch": 1.9129064568929715, "percentage": 97.88, "elapsed_time": "1 day, 17:21:49", "remaining_time": "0:53:53", "throughput": 332.89, "total_tokens": 49570528} {"current_steps": 39155, "total_steps": 40000, "loss": 0.0405, "lr": 0.0003309954058559383, "epoch": 1.9131507585566658, "percentage": 97.89, "elapsed_time": "1 day, 17:21:52", "remaining_time": "0:53:33", "throughput": 332.92, "total_tokens": 49576352} {"current_steps": 39160, "total_steps": 40000, "loss": 0.064, "lr": 0.0003270959106675186, "epoch": 1.9133950602203602, "percentage": 97.9, "elapsed_time": "1 day, 17:21:56", "remaining_time": "0:53:14", "throughput": 332.96, "total_tokens": 49582624} {"current_steps": 39165, "total_steps": 40000, "loss": 0.0671, "lr": 0.0003232194969218227, "epoch": 1.9136393618840546, "percentage": 97.91, "elapsed_time": "1 day, 17:21:59", "remaining_time": "0:52:54", "throughput": 332.99, "total_tokens": 49588736} {"current_steps": 39170, "total_steps": 40000, "loss": 0.0442, "lr": 0.00031936616521663905, "epoch": 1.9138836635477487, "percentage": 97.92, "elapsed_time": "1 day, 17:22:02", "remaining_time": "0:52:35", "throughput": 333.03, "total_tokens": 49595040} {"current_steps": 39175, "total_steps": 40000, "loss": 0.0915, "lr": 0.00031553591614619236, "epoch": 1.9141279652114431, "percentage": 97.94, "elapsed_time": "1 day, 17:22:05", "remaining_time": "0:52:16", "throughput": 333.06, "total_tokens": 49601632} {"current_steps": 39180, "total_steps": 40000, "loss": 0.0445, "lr": 0.00031172875030117676, "epoch": 1.9143722668751373, "percentage": 97.95, "elapsed_time": "1 day, 17:22:08", "remaining_time": "0:51:56", "throughput": 333.1, "total_tokens": 49608544} {"current_steps": 39185, "total_steps": 40000, "loss": 0.0663, "lr": 0.0003079446682686726, "epoch": 1.9146165685388317, "percentage": 97.96, "elapsed_time": "1 day, 17:22:11", "remaining_time": "0:51:37", "throughput": 333.14, "total_tokens": 49614720} {"current_steps": 39190, "total_steps": 40000, "loss": 0.0504, "lr": 0.0003041836706322465, "epoch": 1.914860870202526, "percentage": 97.97, "elapsed_time": "1 day, 17:22:14", "remaining_time": "0:51:18", "throughput": 333.17, "total_tokens": 49621088} {"current_steps": 39195, "total_steps": 40000, "loss": 0.0675, "lr": 0.0003004457579719011, "epoch": 1.9151051718662204, "percentage": 97.99, "elapsed_time": "1 day, 17:22:17", "remaining_time": "0:50:58", "throughput": 333.21, "total_tokens": 49627296} {"current_steps": 39200, "total_steps": 40000, "loss": 0.0416, "lr": 0.00029673093086405867, "epoch": 1.9153494735299148, "percentage": 98.0, "elapsed_time": "1 day, 17:22:20", "remaining_time": "0:50:39", "throughput": 333.24, "total_tokens": 49633664} {"current_steps": 39200, "total_steps": 40000, "eval_loss": 0.06052808836102486, "epoch": 1.9153494735299148, "percentage": 98.0, "elapsed_time": "1 day, 17:32:59", "remaining_time": "0:50:52", "throughput": 331.82, "total_tokens": 49633664} {"current_steps": 39205, "total_steps": 40000, "loss": 0.0574, "lr": 0.00029303918988159426, "epoch": 1.9155937751936092, "percentage": 98.01, "elapsed_time": "1 day, 17:33:03", "remaining_time": "0:50:33", "throughput": 331.85, "total_tokens": 49639808} {"current_steps": 39210, "total_steps": 40000, "loss": 0.0444, "lr": 0.0002893705355938192, "epoch": 1.9158380768573036, "percentage": 98.02, "elapsed_time": "1 day, 17:33:06", "remaining_time": "0:50:13", "throughput": 331.89, "total_tokens": 49646272} {"current_steps": 39215, "total_steps": 40000, "loss": 0.0676, "lr": 0.0002857249685664975, "epoch": 1.9160823785209977, "percentage": 98.04, "elapsed_time": "1 day, 17:33:09", "remaining_time": "0:49:54", "throughput": 331.93, "total_tokens": 49652704} {"current_steps": 39220, "total_steps": 40000, "loss": 0.0669, "lr": 0.0002821024893618129, "epoch": 1.916326680184692, "percentage": 98.05, "elapsed_time": "1 day, 17:33:12", "remaining_time": "0:49:35", "throughput": 331.96, "total_tokens": 49658880} {"current_steps": 39225, "total_steps": 40000, "loss": 0.04, "lr": 0.0002785030985383852, "epoch": 1.9165709818483863, "percentage": 98.06, "elapsed_time": "1 day, 17:33:15", "remaining_time": "0:49:15", "throughput": 332.0, "total_tokens": 49665408} {"current_steps": 39230, "total_steps": 40000, "loss": 0.0666, "lr": 0.00027492679665130356, "epoch": 1.9168152835120806, "percentage": 98.08, "elapsed_time": "1 day, 17:33:18", "remaining_time": "0:48:56", "throughput": 332.03, "total_tokens": 49671424} {"current_steps": 39235, "total_steps": 40000, "loss": 0.0552, "lr": 0.000271373584252077, "epoch": 1.917059585175775, "percentage": 98.09, "elapsed_time": "1 day, 17:33:21", "remaining_time": "0:48:36", "throughput": 332.07, "total_tokens": 49677984} {"current_steps": 39240, "total_steps": 40000, "loss": 0.0665, "lr": 0.00026784346188865046, "epoch": 1.9173038868394694, "percentage": 98.1, "elapsed_time": "1 day, 17:33:25", "remaining_time": "0:48:17", "throughput": 332.1, "total_tokens": 49684256} {"current_steps": 39245, "total_steps": 40000, "loss": 0.0759, "lr": 0.0002643364301054218, "epoch": 1.9175481885031638, "percentage": 98.11, "elapsed_time": "1 day, 17:33:28", "remaining_time": "0:47:58", "throughput": 332.14, "total_tokens": 49690592} {"current_steps": 39250, "total_steps": 40000, "loss": 0.0514, "lr": 0.0002608524894431918, "epoch": 1.9177924901668582, "percentage": 98.12, "elapsed_time": "1 day, 17:33:31", "remaining_time": "0:47:38", "throughput": 332.17, "total_tokens": 49696992} {"current_steps": 39255, "total_steps": 40000, "loss": 0.0991, "lr": 0.000257391640439264, "epoch": 1.9180367918305523, "percentage": 98.14, "elapsed_time": "1 day, 17:33:34", "remaining_time": "0:47:19", "throughput": 332.21, "total_tokens": 49703072} {"current_steps": 39260, "total_steps": 40000, "loss": 0.0813, "lr": 0.00025395388362732806, "epoch": 1.9182810934942467, "percentage": 98.15, "elapsed_time": "1 day, 17:33:37", "remaining_time": "0:47:00", "throughput": 332.24, "total_tokens": 49709184} {"current_steps": 39265, "total_steps": 40000, "loss": 0.0535, "lr": 0.00025053921953751, "epoch": 1.918525395157941, "percentage": 98.16, "elapsed_time": "1 day, 17:33:40", "remaining_time": "0:46:40", "throughput": 332.28, "total_tokens": 49715712} {"current_steps": 39270, "total_steps": 40000, "loss": 0.0408, "lr": 0.00024714764869643855, "epoch": 1.9187696968216352, "percentage": 98.17, "elapsed_time": "1 day, 17:33:43", "remaining_time": "0:46:21", "throughput": 332.32, "total_tokens": 49722176} {"current_steps": 39275, "total_steps": 40000, "loss": 0.0708, "lr": 0.0002437791716270954, "epoch": 1.9190139984853296, "percentage": 98.19, "elapsed_time": "1 day, 17:33:46", "remaining_time": "0:46:02", "throughput": 332.35, "total_tokens": 49728576} {"current_steps": 39280, "total_steps": 40000, "loss": 0.0683, "lr": 0.00024043378884896493, "epoch": 1.919258300149024, "percentage": 98.2, "elapsed_time": "1 day, 17:33:49", "remaining_time": "0:45:42", "throughput": 332.39, "total_tokens": 49735136} {"current_steps": 39285, "total_steps": 40000, "loss": 0.0663, "lr": 0.00023711150087793453, "epoch": 1.9195026018127184, "percentage": 98.21, "elapsed_time": "1 day, 17:33:52", "remaining_time": "0:45:23", "throughput": 332.42, "total_tokens": 49741120} {"current_steps": 39290, "total_steps": 40000, "loss": 0.0414, "lr": 0.000233812308226361, "epoch": 1.9197469034764127, "percentage": 98.22, "elapsed_time": "1 day, 17:33:55", "remaining_time": "0:45:04", "throughput": 332.46, "total_tokens": 49747360} {"current_steps": 39295, "total_steps": 40000, "loss": 0.0628, "lr": 0.00023053621140300406, "epoch": 1.9199912051401071, "percentage": 98.24, "elapsed_time": "1 day, 17:33:58", "remaining_time": "0:44:44", "throughput": 332.49, "total_tokens": 49753600} {"current_steps": 39300, "total_steps": 40000, "loss": 0.0608, "lr": 0.00022728321091307623, "epoch": 1.9202355068038013, "percentage": 98.25, "elapsed_time": "1 day, 17:34:02", "remaining_time": "0:44:25", "throughput": 332.53, "total_tokens": 49760256} {"current_steps": 39305, "total_steps": 40000, "loss": 0.0444, "lr": 0.0002240533072582429, "epoch": 1.9204798084674957, "percentage": 98.26, "elapsed_time": "1 day, 17:34:05", "remaining_time": "0:44:06", "throughput": 332.57, "total_tokens": 49766912} {"current_steps": 39310, "total_steps": 40000, "loss": 0.0497, "lr": 0.00022084650093658897, "epoch": 1.92072411013119, "percentage": 98.28, "elapsed_time": "1 day, 17:34:08", "remaining_time": "0:43:46", "throughput": 332.6, "total_tokens": 49773568} {"current_steps": 39315, "total_steps": 40000, "loss": 0.0411, "lr": 0.0002176627924426522, "epoch": 1.9209684117948842, "percentage": 98.29, "elapsed_time": "1 day, 17:34:11", "remaining_time": "0:43:27", "throughput": 332.64, "total_tokens": 49779456} {"current_steps": 39320, "total_steps": 40000, "loss": 0.0681, "lr": 0.0002145021822673898, "epoch": 1.9212127134585786, "percentage": 98.3, "elapsed_time": "1 day, 17:34:14", "remaining_time": "0:43:08", "throughput": 332.67, "total_tokens": 49786080} {"current_steps": 39325, "total_steps": 40000, "loss": 0.06, "lr": 0.00021136467089822862, "epoch": 1.921457015122273, "percentage": 98.31, "elapsed_time": "1 day, 17:34:17", "remaining_time": "0:42:48", "throughput": 332.71, "total_tokens": 49792256} {"current_steps": 39330, "total_steps": 40000, "loss": 0.0641, "lr": 0.00020825025881898162, "epoch": 1.9217013167859673, "percentage": 98.32, "elapsed_time": "1 day, 17:34:20", "remaining_time": "0:42:29", "throughput": 332.74, "total_tokens": 49798336} {"current_steps": 39335, "total_steps": 40000, "loss": 0.048, "lr": 0.0002051589465099479, "epoch": 1.9219456184496617, "percentage": 98.34, "elapsed_time": "1 day, 17:34:23", "remaining_time": "0:42:10", "throughput": 332.78, "total_tokens": 49804864} {"current_steps": 39340, "total_steps": 40000, "loss": 0.0286, "lr": 0.0002020907344478462, "epoch": 1.922189920113356, "percentage": 98.35, "elapsed_time": "1 day, 17:34:26", "remaining_time": "0:41:50", "throughput": 332.81, "total_tokens": 49810848} {"current_steps": 39345, "total_steps": 40000, "loss": 0.0782, "lr": 0.0001990456231058313, "epoch": 1.9224342217770503, "percentage": 98.36, "elapsed_time": "1 day, 17:34:29", "remaining_time": "0:41:31", "throughput": 332.85, "total_tokens": 49817056} {"current_steps": 39350, "total_steps": 40000, "loss": 0.0288, "lr": 0.00019602361295349423, "epoch": 1.9226785234407446, "percentage": 98.38, "elapsed_time": "1 day, 17:34:32", "remaining_time": "0:41:12", "throughput": 332.88, "total_tokens": 49823488} {"current_steps": 39355, "total_steps": 40000, "loss": 0.0474, "lr": 0.0001930247044568789, "epoch": 1.922922825104439, "percentage": 98.39, "elapsed_time": "1 day, 17:34:35", "remaining_time": "0:40:53", "throughput": 332.92, "total_tokens": 49829760} {"current_steps": 39360, "total_steps": 40000, "loss": 0.0315, "lr": 0.00019004889807843205, "epoch": 1.9231671267681332, "percentage": 98.4, "elapsed_time": "1 day, 17:34:39", "remaining_time": "0:40:33", "throughput": 332.96, "total_tokens": 49836800} {"current_steps": 39365, "total_steps": 40000, "loss": 0.0587, "lr": 0.00018709619427708656, "epoch": 1.9234114284318276, "percentage": 98.41, "elapsed_time": "1 day, 17:34:42", "remaining_time": "0:40:14", "throughput": 332.99, "total_tokens": 49842816} {"current_steps": 39370, "total_steps": 40000, "loss": 0.0492, "lr": 0.00018416659350817822, "epoch": 1.923655730095522, "percentage": 98.42, "elapsed_time": "1 day, 17:34:45", "remaining_time": "0:39:55", "throughput": 333.03, "total_tokens": 49849024} {"current_steps": 39375, "total_steps": 40000, "loss": 0.0543, "lr": 0.00018126009622346229, "epoch": 1.9239000317592163, "percentage": 98.44, "elapsed_time": "1 day, 17:34:48", "remaining_time": "0:39:36", "throughput": 333.06, "total_tokens": 49855008} {"current_steps": 39380, "total_steps": 40000, "loss": 0.0473, "lr": 0.00017837670287119687, "epoch": 1.9241443334229107, "percentage": 98.45, "elapsed_time": "1 day, 17:34:51", "remaining_time": "0:39:16", "throughput": 333.1, "total_tokens": 49861568} {"current_steps": 39385, "total_steps": 40000, "loss": 0.0442, "lr": 0.00017551641389602633, "epoch": 1.924388635086605, "percentage": 98.46, "elapsed_time": "1 day, 17:34:54", "remaining_time": "0:38:57", "throughput": 333.13, "total_tokens": 49867808} {"current_steps": 39390, "total_steps": 40000, "loss": 0.0674, "lr": 0.00017267922973903115, "epoch": 1.9246329367502992, "percentage": 98.47, "elapsed_time": "1 day, 17:34:57", "remaining_time": "0:38:38", "throughput": 333.17, "total_tokens": 49874144} {"current_steps": 39395, "total_steps": 40000, "loss": 0.0469, "lr": 0.00016986515083774467, "epoch": 1.9248772384139936, "percentage": 98.49, "elapsed_time": "1 day, 17:35:00", "remaining_time": "0:38:18", "throughput": 333.2, "total_tokens": 49880672} {"current_steps": 39400, "total_steps": 40000, "loss": 0.057, "lr": 0.00016707417762611975, "epoch": 1.9251215400776878, "percentage": 98.5, "elapsed_time": "1 day, 17:35:03", "remaining_time": "0:37:59", "throughput": 333.24, "total_tokens": 49887680} {"current_steps": 39400, "total_steps": 40000, "eval_loss": 0.06055303290486336, "epoch": 1.9251215400776878, "percentage": 98.5, "elapsed_time": "1 day, 17:45:42", "remaining_time": "0:38:09", "throughput": 331.83, "total_tokens": 49887680} {"current_steps": 39405, "total_steps": 40000, "loss": 0.0721, "lr": 0.00016430631053459543, "epoch": 1.9253658417413821, "percentage": 98.51, "elapsed_time": "1 day, 17:45:47", "remaining_time": "0:37:50", "throughput": 331.86, "total_tokens": 49893952} {"current_steps": 39410, "total_steps": 40000, "loss": 0.0253, "lr": 0.0001615615499899803, "epoch": 1.9256101434050765, "percentage": 98.52, "elapsed_time": "1 day, 17:45:50", "remaining_time": "0:37:30", "throughput": 331.89, "total_tokens": 49900128} {"current_steps": 39415, "total_steps": 40000, "loss": 0.0555, "lr": 0.00015883989641556905, "epoch": 1.925854445068771, "percentage": 98.54, "elapsed_time": "1 day, 17:45:53", "remaining_time": "0:37:11", "throughput": 331.93, "total_tokens": 49906368} {"current_steps": 39420, "total_steps": 40000, "loss": 0.0383, "lr": 0.00015614135023105934, "epoch": 1.9260987467324653, "percentage": 98.55, "elapsed_time": "1 day, 17:45:57", "remaining_time": "0:36:52", "throughput": 331.96, "total_tokens": 49912512} {"current_steps": 39425, "total_steps": 40000, "loss": 0.069, "lr": 0.00015346591185261827, "epoch": 1.9263430483961597, "percentage": 98.56, "elapsed_time": "1 day, 17:46:00", "remaining_time": "0:36:32", "throughput": 331.99, "total_tokens": 49918784} {"current_steps": 39430, "total_steps": 40000, "loss": 0.0332, "lr": 0.00015081358169281576, "epoch": 1.926587350059854, "percentage": 98.58, "elapsed_time": "1 day, 17:46:03", "remaining_time": "0:36:13", "throughput": 332.03, "total_tokens": 49925216} {"current_steps": 39435, "total_steps": 40000, "loss": 0.0267, "lr": 0.00014818436016069135, "epoch": 1.9268316517235482, "percentage": 98.59, "elapsed_time": "1 day, 17:46:06", "remaining_time": "0:35:54", "throughput": 332.06, "total_tokens": 49931328} {"current_steps": 39440, "total_steps": 40000, "loss": 0.0525, "lr": 0.00014557824766168735, "epoch": 1.9270759533872426, "percentage": 98.6, "elapsed_time": "1 day, 17:46:09", "remaining_time": "0:35:35", "throughput": 332.1, "total_tokens": 49937600} {"current_steps": 39445, "total_steps": 40000, "loss": 0.0436, "lr": 0.00014299524459769896, "epoch": 1.9273202550509367, "percentage": 98.61, "elapsed_time": "1 day, 17:46:12", "remaining_time": "0:35:15", "throughput": 332.14, "total_tokens": 49944096} {"current_steps": 39450, "total_steps": 40000, "loss": 0.0807, "lr": 0.0001404353513670742, "epoch": 1.9275645567146311, "percentage": 98.62, "elapsed_time": "1 day, 17:46:15", "remaining_time": "0:34:56", "throughput": 332.17, "total_tokens": 49950528} {"current_steps": 39455, "total_steps": 40000, "loss": 0.0505, "lr": 0.0001378985683645806, "epoch": 1.9278088583783255, "percentage": 98.64, "elapsed_time": "1 day, 17:46:18", "remaining_time": "0:34:37", "throughput": 332.21, "total_tokens": 49956768} {"current_steps": 39460, "total_steps": 40000, "loss": 0.0401, "lr": 0.0001353848959813886, "epoch": 1.9280531600420199, "percentage": 98.65, "elapsed_time": "1 day, 17:46:21", "remaining_time": "0:34:17", "throughput": 332.24, "total_tokens": 49963424} {"current_steps": 39465, "total_steps": 40000, "loss": 0.0444, "lr": 0.00013289433460517142, "epoch": 1.9282974617057143, "percentage": 98.66, "elapsed_time": "1 day, 17:46:24", "remaining_time": "0:33:58", "throughput": 332.28, "total_tokens": 49969696} {"current_steps": 39470, "total_steps": 40000, "loss": 0.0595, "lr": 0.00013042688462000518, "epoch": 1.9285417633694086, "percentage": 98.67, "elapsed_time": "1 day, 17:46:27", "remaining_time": "0:33:39", "throughput": 332.31, "total_tokens": 49976128} {"current_steps": 39475, "total_steps": 40000, "loss": 0.0712, "lr": 0.0001279825464063855, "epoch": 1.928786065033103, "percentage": 98.69, "elapsed_time": "1 day, 17:46:30", "remaining_time": "0:33:20", "throughput": 332.35, "total_tokens": 49982496} {"current_steps": 39480, "total_steps": 40000, "loss": 0.0531, "lr": 0.00012556132034126087, "epoch": 1.9290303666967972, "percentage": 98.7, "elapsed_time": "1 day, 17:46:33", "remaining_time": "0:33:00", "throughput": 332.39, "total_tokens": 49988800} {"current_steps": 39485, "total_steps": 40000, "loss": 0.0444, "lr": 0.0001231632067980326, "epoch": 1.9292746683604916, "percentage": 98.71, "elapsed_time": "1 day, 17:46:37", "remaining_time": "0:32:41", "throughput": 332.42, "total_tokens": 49995328} {"current_steps": 39490, "total_steps": 40000, "loss": 0.0564, "lr": 0.00012078820614650486, "epoch": 1.9295189700241857, "percentage": 98.72, "elapsed_time": "1 day, 17:46:40", "remaining_time": "0:32:22", "throughput": 332.46, "total_tokens": 50001568} {"current_steps": 39495, "total_steps": 40000, "loss": 0.0617, "lr": 0.00011843631875291804, "epoch": 1.92976327168788, "percentage": 98.74, "elapsed_time": "1 day, 17:46:43", "remaining_time": "0:32:03", "throughput": 332.49, "total_tokens": 50007840} {"current_steps": 39500, "total_steps": 40000, "loss": 0.0701, "lr": 0.00011610754497999863, "epoch": 1.9300075733515745, "percentage": 98.75, "elapsed_time": "1 day, 17:46:46", "remaining_time": "0:31:43", "throughput": 332.53, "total_tokens": 50014208} {"current_steps": 39505, "total_steps": 40000, "loss": 0.0402, "lr": 0.0001138018851868594, "epoch": 1.9302518750152688, "percentage": 98.76, "elapsed_time": "1 day, 17:46:49", "remaining_time": "0:31:24", "throughput": 332.56, "total_tokens": 50020224} {"current_steps": 39510, "total_steps": 40000, "loss": 0.0696, "lr": 0.0001115193397290326, "epoch": 1.9304961766789632, "percentage": 98.78, "elapsed_time": "1 day, 17:46:52", "remaining_time": "0:31:05", "throughput": 332.59, "total_tokens": 50026400} {"current_steps": 39515, "total_steps": 40000, "loss": 0.0699, "lr": 0.00010925990895856996, "epoch": 1.9307404783426576, "percentage": 98.79, "elapsed_time": "1 day, 17:46:55", "remaining_time": "0:30:46", "throughput": 332.63, "total_tokens": 50032160} {"current_steps": 39520, "total_steps": 40000, "loss": 0.0475, "lr": 0.00010702359322385946, "epoch": 1.930984780006352, "percentage": 98.8, "elapsed_time": "1 day, 17:46:58", "remaining_time": "0:30:26", "throughput": 332.66, "total_tokens": 50038240} {"current_steps": 39525, "total_steps": 40000, "loss": 0.0577, "lr": 0.00010481039286977523, "epoch": 1.9312290816700461, "percentage": 98.81, "elapsed_time": "1 day, 17:47:01", "remaining_time": "0:30:07", "throughput": 332.7, "total_tokens": 50044672} {"current_steps": 39530, "total_steps": 40000, "loss": 0.0536, "lr": 0.00010262030823764423, "epoch": 1.9314733833337405, "percentage": 98.83, "elapsed_time": "1 day, 17:47:04", "remaining_time": "0:29:48", "throughput": 332.73, "total_tokens": 50051520} {"current_steps": 39535, "total_steps": 40000, "loss": 0.064, "lr": 0.00010045333966517966, "epoch": 1.9317176849974347, "percentage": 98.84, "elapsed_time": "1 day, 17:47:07", "remaining_time": "0:29:29", "throughput": 332.77, "total_tokens": 50057824} {"current_steps": 39540, "total_steps": 40000, "loss": 0.052, "lr": 9.83094874865642e-05, "epoch": 1.931961986661129, "percentage": 98.85, "elapsed_time": "1 day, 17:47:10", "remaining_time": "0:29:10", "throughput": 332.81, "total_tokens": 50064448} {"current_steps": 39545, "total_steps": 40000, "loss": 0.0319, "lr": 9.618875203241672e-05, "epoch": 1.9322062883248234, "percentage": 98.86, "elapsed_time": "1 day, 17:47:14", "remaining_time": "0:28:50", "throughput": 332.84, "total_tokens": 50071232} {"current_steps": 39550, "total_steps": 40000, "loss": 0.0464, "lr": 9.409113362977561e-05, "epoch": 1.9324505899885178, "percentage": 98.88, "elapsed_time": "1 day, 17:47:17", "remaining_time": "0:28:31", "throughput": 332.88, "total_tokens": 50077152} {"current_steps": 39555, "total_steps": 40000, "loss": 0.0318, "lr": 9.20166326020988e-05, "epoch": 1.9326948916522122, "percentage": 98.89, "elapsed_time": "1 day, 17:47:20", "remaining_time": "0:28:12", "throughput": 332.91, "total_tokens": 50083584} {"current_steps": 39560, "total_steps": 40000, "loss": 0.0618, "lr": 8.996524926933035e-05, "epoch": 1.9329391933159066, "percentage": 98.9, "elapsed_time": "1 day, 17:47:23", "remaining_time": "0:27:53", "throughput": 332.95, "total_tokens": 50090304} {"current_steps": 39565, "total_steps": 40000, "loss": 0.0285, "lr": 8.793698394781723e-05, "epoch": 1.933183494979601, "percentage": 98.91, "elapsed_time": "1 day, 17:47:26", "remaining_time": "0:27:34", "throughput": 332.98, "total_tokens": 50096320} {"current_steps": 39570, "total_steps": 40000, "loss": 0.08, "lr": 8.593183695030926e-05, "epoch": 1.9334277966432951, "percentage": 98.92, "elapsed_time": "1 day, 17:47:29", "remaining_time": "0:27:14", "throughput": 333.02, "total_tokens": 50102528} {"current_steps": 39575, "total_steps": 40000, "loss": 0.0659, "lr": 8.39498085860757e-05, "epoch": 1.9336720983069895, "percentage": 98.94, "elapsed_time": "1 day, 17:47:32", "remaining_time": "0:26:55", "throughput": 333.05, "total_tokens": 50108864} {"current_steps": 39580, "total_steps": 40000, "loss": 0.0558, "lr": 8.199089916072211e-05, "epoch": 1.9339163999706837, "percentage": 98.95, "elapsed_time": "1 day, 17:47:35", "remaining_time": "0:26:36", "throughput": 333.09, "total_tokens": 50114880} {"current_steps": 39585, "total_steps": 40000, "loss": 0.0735, "lr": 8.005510897637346e-05, "epoch": 1.934160701634378, "percentage": 98.96, "elapsed_time": "1 day, 17:47:38", "remaining_time": "0:26:17", "throughput": 333.12, "total_tokens": 50120800} {"current_steps": 39590, "total_steps": 40000, "loss": 0.042, "lr": 7.8142438331541e-05, "epoch": 1.9344050032980724, "percentage": 98.98, "elapsed_time": "1 day, 17:47:41", "remaining_time": "0:25:58", "throughput": 333.16, "total_tokens": 50127040} {"current_steps": 39595, "total_steps": 40000, "loss": 0.0455, "lr": 7.625288752117209e-05, "epoch": 1.9346493049617668, "percentage": 98.99, "elapsed_time": "1 day, 17:47:44", "remaining_time": "0:25:39", "throughput": 333.19, "total_tokens": 50132864} {"current_steps": 39600, "total_steps": 40000, "loss": 0.0431, "lr": 7.4386456836667e-05, "epoch": 1.9348936066254612, "percentage": 99.0, "elapsed_time": "1 day, 17:47:47", "remaining_time": "0:25:19", "throughput": 333.22, "total_tokens": 50139296} {"current_steps": 39600, "total_steps": 40000, "eval_loss": 0.06054786220192909, "epoch": 1.9348936066254612, "percentage": 99.0, "elapsed_time": "1 day, 17:58:25", "remaining_time": "0:25:26", "throughput": 331.82, "total_tokens": 50139296} {"current_steps": 39605, "total_steps": 40000, "loss": 0.0499, "lr": 7.254314656586214e-05, "epoch": 1.9351379082891556, "percentage": 99.01, "elapsed_time": "1 day, 17:58:29", "remaining_time": "0:25:07", "throughput": 331.85, "total_tokens": 50145760} {"current_steps": 39610, "total_steps": 40000, "loss": 0.0303, "lr": 7.07229569929968e-05, "epoch": 1.93538220995285, "percentage": 99.02, "elapsed_time": "1 day, 17:58:32", "remaining_time": "0:24:47", "throughput": 331.89, "total_tokens": 50152448} {"current_steps": 39615, "total_steps": 40000, "loss": 0.0502, "lr": 6.892588839879643e-05, "epoch": 1.935626511616544, "percentage": 99.04, "elapsed_time": "1 day, 17:58:35", "remaining_time": "0:24:28", "throughput": 331.92, "total_tokens": 50158400} {"current_steps": 39620, "total_steps": 40000, "loss": 0.0579, "lr": 6.71519410603727e-05, "epoch": 1.9358708132802385, "percentage": 99.05, "elapsed_time": "1 day, 17:58:38", "remaining_time": "0:24:09", "throughput": 331.96, "total_tokens": 50165184} {"current_steps": 39625, "total_steps": 40000, "loss": 0.0964, "lr": 6.540111525129011e-05, "epoch": 1.9361151149439326, "percentage": 99.06, "elapsed_time": "1 day, 17:58:41", "remaining_time": "0:23:50", "throughput": 331.99, "total_tokens": 50171360} {"current_steps": 39630, "total_steps": 40000, "loss": 0.0693, "lr": 6.367341124154934e-05, "epoch": 1.936359416607627, "percentage": 99.08, "elapsed_time": "1 day, 17:58:44", "remaining_time": "0:23:30", "throughput": 332.03, "total_tokens": 50177760} {"current_steps": 39635, "total_steps": 40000, "loss": 0.0293, "lr": 6.19688292975873e-05, "epoch": 1.9366037182713214, "percentage": 99.09, "elapsed_time": "1 day, 17:58:48", "remaining_time": "0:23:11", "throughput": 332.06, "total_tokens": 50184160} {"current_steps": 39640, "total_steps": 40000, "loss": 0.0525, "lr": 6.0287369682260336e-05, "epoch": 1.9368480199350158, "percentage": 99.1, "elapsed_time": "1 day, 17:58:51", "remaining_time": "0:22:52", "throughput": 332.1, "total_tokens": 50190176} {"current_steps": 39645, "total_steps": 40000, "loss": 0.0658, "lr": 5.8629032654894384e-05, "epoch": 1.9370923215987101, "percentage": 99.11, "elapsed_time": "1 day, 17:58:54", "remaining_time": "0:22:33", "throughput": 332.13, "total_tokens": 50196160} {"current_steps": 39650, "total_steps": 40000, "loss": 0.0621, "lr": 5.699381847120155e-05, "epoch": 1.9373366232624045, "percentage": 99.12, "elapsed_time": "1 day, 17:58:57", "remaining_time": "0:22:14", "throughput": 332.16, "total_tokens": 50201888} {"current_steps": 39655, "total_steps": 40000, "loss": 0.0548, "lr": 5.5381727383380094e-05, "epoch": 1.937580924926099, "percentage": 99.14, "elapsed_time": "1 day, 17:59:00", "remaining_time": "0:21:54", "throughput": 332.19, "total_tokens": 50207776} {"current_steps": 39660, "total_steps": 40000, "loss": 0.0747, "lr": 5.379275964001451e-05, "epoch": 1.937825226589793, "percentage": 99.15, "elapsed_time": "1 day, 17:59:03", "remaining_time": "0:21:35", "throughput": 332.23, "total_tokens": 50214752} {"current_steps": 39665, "total_steps": 40000, "loss": 0.0597, "lr": 5.222691548614211e-05, "epoch": 1.9380695282534874, "percentage": 99.16, "elapsed_time": "1 day, 17:59:06", "remaining_time": "0:21:16", "throughput": 332.27, "total_tokens": 50221312} {"current_steps": 39670, "total_steps": 40000, "loss": 0.0733, "lr": 5.068419516323641e-05, "epoch": 1.9383138299171816, "percentage": 99.17, "elapsed_time": "1 day, 17:59:09", "remaining_time": "0:20:57", "throughput": 332.31, "total_tokens": 50227680} {"current_steps": 39675, "total_steps": 40000, "loss": 0.0633, "lr": 4.91645989092071e-05, "epoch": 1.938558131580876, "percentage": 99.19, "elapsed_time": "1 day, 17:59:12", "remaining_time": "0:20:38", "throughput": 332.34, "total_tokens": 50234080} {"current_steps": 39680, "total_steps": 40000, "loss": 0.0582, "lr": 4.7668126958400056e-05, "epoch": 1.9388024332445704, "percentage": 99.2, "elapsed_time": "1 day, 17:59:15", "remaining_time": "0:20:18", "throughput": 332.38, "total_tokens": 50240704} {"current_steps": 39685, "total_steps": 40000, "loss": 0.0406, "lr": 4.619477954159734e-05, "epoch": 1.9390467349082647, "percentage": 99.21, "elapsed_time": "1 day, 17:59:18", "remaining_time": "0:19:59", "throughput": 332.41, "total_tokens": 50246560} {"current_steps": 39690, "total_steps": 40000, "loss": 0.0301, "lr": 4.4744556885983884e-05, "epoch": 1.9392910365719591, "percentage": 99.22, "elapsed_time": "1 day, 17:59:21", "remaining_time": "0:19:40", "throughput": 332.45, "total_tokens": 50253152} {"current_steps": 39695, "total_steps": 40000, "loss": 0.0448, "lr": 4.331745921523078e-05, "epoch": 1.9395353382356535, "percentage": 99.24, "elapsed_time": "1 day, 17:59:24", "remaining_time": "0:19:21", "throughput": 332.48, "total_tokens": 50259872} {"current_steps": 39700, "total_steps": 40000, "loss": 0.0394, "lr": 4.191348674937867e-05, "epoch": 1.9397796398993479, "percentage": 99.25, "elapsed_time": "1 day, 17:59:28", "remaining_time": "0:19:02", "throughput": 332.52, "total_tokens": 50266432} {"current_steps": 39705, "total_steps": 40000, "loss": 0.0503, "lr": 4.0532639704971006e-05, "epoch": 1.940023941563042, "percentage": 99.26, "elapsed_time": "1 day, 17:59:31", "remaining_time": "0:18:43", "throughput": 332.56, "total_tokens": 50273376} {"current_steps": 39710, "total_steps": 40000, "loss": 0.0389, "lr": 3.917491829493747e-05, "epoch": 1.9402682432267364, "percentage": 99.28, "elapsed_time": "1 day, 17:59:34", "remaining_time": "0:18:24", "throughput": 332.59, "total_tokens": 50279520} {"current_steps": 39715, "total_steps": 40000, "loss": 0.075, "lr": 3.78403227286439e-05, "epoch": 1.9405125448904306, "percentage": 99.29, "elapsed_time": "1 day, 17:59:37", "remaining_time": "0:18:04", "throughput": 332.63, "total_tokens": 50285600} {"current_steps": 39720, "total_steps": 40000, "loss": 0.0588, "lr": 3.652885321192567e-05, "epoch": 1.940756846554125, "percentage": 99.3, "elapsed_time": "1 day, 17:59:40", "remaining_time": "0:17:45", "throughput": 332.66, "total_tokens": 50291584} {"current_steps": 39725, "total_steps": 40000, "loss": 0.0494, "lr": 3.524050994702099e-05, "epoch": 1.9410011482178193, "percentage": 99.31, "elapsed_time": "1 day, 17:59:43", "remaining_time": "0:17:26", "throughput": 332.7, "total_tokens": 50297984} {"current_steps": 39730, "total_steps": 40000, "loss": 0.0543, "lr": 3.3975293132604276e-05, "epoch": 1.9412454498815137, "percentage": 99.33, "elapsed_time": "1 day, 17:59:46", "remaining_time": "0:17:07", "throughput": 332.73, "total_tokens": 50303904} {"current_steps": 39735, "total_steps": 40000, "loss": 0.0437, "lr": 3.2733202963786125e-05, "epoch": 1.941489751545208, "percentage": 99.34, "elapsed_time": "1 day, 17:59:49", "remaining_time": "0:16:48", "throughput": 332.76, "total_tokens": 50310368} {"current_steps": 39740, "total_steps": 40000, "loss": 0.0633, "lr": 3.15142396321133e-05, "epoch": 1.9417340532089025, "percentage": 99.35, "elapsed_time": "1 day, 17:59:52", "remaining_time": "0:16:29", "throughput": 332.8, "total_tokens": 50316384} {"current_steps": 39745, "total_steps": 40000, "loss": 0.0544, "lr": 3.0318403325552132e-05, "epoch": 1.9419783548725968, "percentage": 99.36, "elapsed_time": "1 day, 17:59:55", "remaining_time": "0:16:10", "throughput": 332.83, "total_tokens": 50322784} {"current_steps": 39750, "total_steps": 40000, "loss": 0.0591, "lr": 2.914569422855506e-05, "epoch": 1.942222656536291, "percentage": 99.38, "elapsed_time": "1 day, 17:59:58", "remaining_time": "0:15:50", "throughput": 332.87, "total_tokens": 50328960} {"current_steps": 39755, "total_steps": 40000, "loss": 0.0549, "lr": 2.7996112521927462e-05, "epoch": 1.9424669581999854, "percentage": 99.39, "elapsed_time": "1 day, 18:00:01", "remaining_time": "0:15:31", "throughput": 332.9, "total_tokens": 50335232} {"current_steps": 39760, "total_steps": 40000, "loss": 0.0785, "lr": 2.68696583829775e-05, "epoch": 1.9427112598636795, "percentage": 99.4, "elapsed_time": "1 day, 18:00:04", "remaining_time": "0:15:12", "throughput": 332.93, "total_tokens": 50341184} {"current_steps": 39765, "total_steps": 40000, "loss": 0.0644, "lr": 2.576633198539957e-05, "epoch": 1.942955561527374, "percentage": 99.41, "elapsed_time": "1 day, 18:00:07", "remaining_time": "0:14:53", "throughput": 332.97, "total_tokens": 50347296} {"current_steps": 39770, "total_steps": 40000, "loss": 0.0605, "lr": 2.46861334993409e-05, "epoch": 1.9431998631910683, "percentage": 99.42, "elapsed_time": "1 day, 18:00:10", "remaining_time": "0:14:34", "throughput": 333.0, "total_tokens": 50353728} {"current_steps": 39775, "total_steps": 40000, "loss": 0.0457, "lr": 2.3629063091384903e-05, "epoch": 1.9434441648547627, "percentage": 99.44, "elapsed_time": "1 day, 18:00:13", "remaining_time": "0:14:15", "throughput": 333.04, "total_tokens": 50360224} {"current_steps": 39780, "total_steps": 40000, "loss": 0.0539, "lr": 2.2595120924567834e-05, "epoch": 1.943688466518457, "percentage": 99.45, "elapsed_time": "1 day, 18:00:16", "remaining_time": "0:13:56", "throughput": 333.07, "total_tokens": 50366176} {"current_steps": 39785, "total_steps": 40000, "loss": 0.0447, "lr": 2.158430715829551e-05, "epoch": 1.9439327681821514, "percentage": 99.46, "elapsed_time": "1 day, 18:00:19", "remaining_time": "0:13:37", "throughput": 333.11, "total_tokens": 50372320} {"current_steps": 39790, "total_steps": 40000, "loss": 0.033, "lr": 2.059662194849321e-05, "epoch": 1.9441770698458456, "percentage": 99.48, "elapsed_time": "1 day, 18:00:22", "remaining_time": "0:13:18", "throughput": 333.14, "total_tokens": 50378944} {"current_steps": 39795, "total_steps": 40000, "loss": 0.062, "lr": 1.9632065447422463e-05, "epoch": 1.94442137150954, "percentage": 99.49, "elapsed_time": "1 day, 18:00:25", "remaining_time": "0:12:59", "throughput": 333.18, "total_tokens": 50385152} {"current_steps": 39800, "total_steps": 40000, "loss": 0.0443, "lr": 1.8690637803880916e-05, "epoch": 1.9446656731732344, "percentage": 99.5, "elapsed_time": "1 day, 18:00:28", "remaining_time": "0:12:39", "throughput": 333.21, "total_tokens": 50391680} {"current_steps": 39800, "total_steps": 40000, "eval_loss": 0.06055711209774017, "epoch": 1.9446656731732344, "percentage": 99.5, "elapsed_time": "1 day, 18:11:07", "remaining_time": "0:12:43", "throughput": 331.81, "total_tokens": 50391680} {"current_steps": 39805, "total_steps": 40000, "loss": 0.0656, "lr": 1.7772339163019123e-05, "epoch": 1.9449099748369285, "percentage": 99.51, "elapsed_time": "1 day, 18:11:11", "remaining_time": "0:12:23", "throughput": 331.85, "total_tokens": 50398464} {"current_steps": 39810, "total_steps": 40000, "loss": 0.0435, "lr": 1.6877169666457138e-05, "epoch": 1.945154276500623, "percentage": 99.52, "elapsed_time": "1 day, 18:11:14", "remaining_time": "0:12:04", "throughput": 331.89, "total_tokens": 50404800} {"current_steps": 39815, "total_steps": 40000, "loss": 0.0765, "lr": 1.6005129452234532e-05, "epoch": 1.9453985781643173, "percentage": 99.54, "elapsed_time": "1 day, 18:11:17", "remaining_time": "0:11:45", "throughput": 331.92, "total_tokens": 50411104} {"current_steps": 39820, "total_steps": 40000, "loss": 0.0576, "lr": 1.5156218654843733e-05, "epoch": 1.9456428798280117, "percentage": 99.55, "elapsed_time": "1 day, 18:11:20", "remaining_time": "0:11:26", "throughput": 331.96, "total_tokens": 50417632} {"current_steps": 39825, "total_steps": 40000, "loss": 0.063, "lr": 1.4330437405196683e-05, "epoch": 1.945887181491706, "percentage": 99.56, "elapsed_time": "1 day, 18:11:23", "remaining_time": "0:11:07", "throughput": 331.99, "total_tokens": 50424192} {"current_steps": 39830, "total_steps": 40000, "loss": 0.1167, "lr": 1.352778583062486e-05, "epoch": 1.9461314831554004, "percentage": 99.58, "elapsed_time": "1 day, 18:11:26", "remaining_time": "0:10:48", "throughput": 332.03, "total_tokens": 50430912} {"current_steps": 39835, "total_steps": 40000, "loss": 0.0428, "lr": 1.2748264054929237e-05, "epoch": 1.9463757848190946, "percentage": 99.59, "elapsed_time": "1 day, 18:11:29", "remaining_time": "0:10:29", "throughput": 332.07, "total_tokens": 50437344} {"current_steps": 39840, "total_steps": 40000, "loss": 0.0641, "lr": 1.1991872198297004e-05, "epoch": 1.946620086482789, "percentage": 99.6, "elapsed_time": "1 day, 18:11:32", "remaining_time": "0:10:10", "throughput": 332.1, "total_tokens": 50443904} {"current_steps": 39845, "total_steps": 40000, "loss": 0.0782, "lr": 1.1258610377384847e-05, "epoch": 1.9468643881464833, "percentage": 99.61, "elapsed_time": "1 day, 18:11:35", "remaining_time": "0:09:50", "throughput": 332.14, "total_tokens": 50450464} {"current_steps": 39850, "total_steps": 40000, "loss": 0.0648, "lr": 1.0548478705268982e-05, "epoch": 1.9471086898101775, "percentage": 99.62, "elapsed_time": "1 day, 18:11:38", "remaining_time": "0:09:31", "throughput": 332.17, "total_tokens": 50456640} {"current_steps": 39855, "total_steps": 40000, "loss": 0.0575, "lr": 9.86147729147846e-06, "epoch": 1.9473529914738719, "percentage": 99.64, "elapsed_time": "1 day, 18:11:41", "remaining_time": "0:09:12", "throughput": 332.21, "total_tokens": 50462848} {"current_steps": 39860, "total_steps": 40000, "loss": 0.0596, "lr": 9.197606241928557e-06, "epoch": 1.9475972931375662, "percentage": 99.65, "elapsed_time": "1 day, 18:11:44", "remaining_time": "0:08:53", "throughput": 332.24, "total_tokens": 50469248} {"current_steps": 39865, "total_steps": 40000, "loss": 0.049, "lr": 8.556865659004042e-06, "epoch": 1.9478415948012606, "percentage": 99.66, "elapsed_time": "1 day, 18:11:48", "remaining_time": "0:08:34", "throughput": 332.28, "total_tokens": 50475936} {"current_steps": 39870, "total_steps": 40000, "loss": 0.0482, "lr": 7.939255641525867e-06, "epoch": 1.948085896464955, "percentage": 99.67, "elapsed_time": "1 day, 18:11:51", "remaining_time": "0:08:15", "throughput": 332.31, "total_tokens": 50481696} {"current_steps": 39875, "total_steps": 40000, "loss": 0.0855, "lr": 7.344776284751164e-06, "epoch": 1.9483301981286494, "percentage": 99.69, "elapsed_time": "1 day, 18:11:54", "remaining_time": "0:07:56", "throughput": 332.35, "total_tokens": 50488192} {"current_steps": 39880, "total_steps": 40000, "loss": 0.0435, "lr": 6.773427680323296e-06, "epoch": 1.9485744997923435, "percentage": 99.7, "elapsed_time": "1 day, 18:11:57", "remaining_time": "0:07:37", "throughput": 332.38, "total_tokens": 50494880} {"current_steps": 39885, "total_steps": 40000, "loss": 0.0581, "lr": 6.225209916355112e-06, "epoch": 1.948818801456038, "percentage": 99.71, "elapsed_time": "1 day, 18:12:00", "remaining_time": "0:07:18", "throughput": 332.42, "total_tokens": 50501056} {"current_steps": 39890, "total_steps": 40000, "loss": 0.0661, "lr": 5.7001230774123e-06, "epoch": 1.9490631031197323, "percentage": 99.72, "elapsed_time": "1 day, 18:12:03", "remaining_time": "0:06:58", "throughput": 332.45, "total_tokens": 50507488} {"current_steps": 39895, "total_steps": 40000, "loss": 0.0947, "lr": 5.198167244446772e-06, "epoch": 1.9493074047834265, "percentage": 99.74, "elapsed_time": "1 day, 18:12:06", "remaining_time": "0:06:39", "throughput": 332.49, "total_tokens": 50513472} {"current_steps": 39900, "total_steps": 40000, "loss": 0.0493, "lr": 4.71934249487993e-06, "epoch": 1.9495517064471208, "percentage": 99.75, "elapsed_time": "1 day, 18:12:09", "remaining_time": "0:06:20", "throughput": 332.52, "total_tokens": 50519520} {"current_steps": 39905, "total_steps": 40000, "loss": 0.0343, "lr": 4.2636489025527075e-06, "epoch": 1.9497960081108152, "percentage": 99.76, "elapsed_time": "1 day, 18:12:12", "remaining_time": "0:06:01", "throughput": 332.55, "total_tokens": 50525408} {"current_steps": 39910, "total_steps": 40000, "loss": 0.062, "lr": 3.831086537742223e-06, "epoch": 1.9500403097745096, "percentage": 99.78, "elapsed_time": "1 day, 18:12:15", "remaining_time": "0:05:42", "throughput": 332.59, "total_tokens": 50531616} {"current_steps": 39915, "total_steps": 40000, "loss": 0.0776, "lr": 3.4216554671451236e-06, "epoch": 1.950284611438204, "percentage": 99.79, "elapsed_time": "1 day, 18:12:18", "remaining_time": "0:05:23", "throughput": 332.63, "total_tokens": 50538912} {"current_steps": 39920, "total_steps": 40000, "loss": 0.0587, "lr": 3.035355753894242e-06, "epoch": 1.9505289131018984, "percentage": 99.8, "elapsed_time": "1 day, 18:12:21", "remaining_time": "0:05:04", "throughput": 332.66, "total_tokens": 50545216} {"current_steps": 39925, "total_steps": 40000, "loss": 0.0331, "lr": 2.6721874575752477e-06, "epoch": 1.9507732147655925, "percentage": 99.81, "elapsed_time": "1 day, 18:12:24", "remaining_time": "0:04:45", "throughput": 332.7, "total_tokens": 50551680} {"current_steps": 39930, "total_steps": 40000, "loss": 0.0486, "lr": 2.3321506341933418e-06, "epoch": 1.951017516429287, "percentage": 99.83, "elapsed_time": "1 day, 18:12:28", "remaining_time": "0:04:26", "throughput": 332.73, "total_tokens": 50558144} {"current_steps": 39935, "total_steps": 40000, "loss": 0.0523, "lr": 2.0152453361732546e-06, "epoch": 1.951261818092981, "percentage": 99.84, "elapsed_time": "1 day, 18:12:31", "remaining_time": "0:04:07", "throughput": 332.76, "total_tokens": 50563936} {"current_steps": 39940, "total_steps": 40000, "loss": 0.0493, "lr": 1.7214716123925554e-06, "epoch": 1.9515061197566754, "percentage": 99.85, "elapsed_time": "1 day, 18:12:34", "remaining_time": "0:03:48", "throughput": 332.8, "total_tokens": 50569952} {"current_steps": 39945, "total_steps": 40000, "loss": 0.0712, "lr": 1.4508295081649968e-06, "epoch": 1.9517504214203698, "percentage": 99.86, "elapsed_time": "1 day, 18:12:37", "remaining_time": "0:03:29", "throughput": 332.83, "total_tokens": 50576480} {"current_steps": 39950, "total_steps": 40000, "loss": 0.0722, "lr": 1.2033190652238623e-06, "epoch": 1.9519947230840642, "percentage": 99.88, "elapsed_time": "1 day, 18:12:40", "remaining_time": "0:03:10", "throughput": 332.87, "total_tokens": 50582688} {"current_steps": 39955, "total_steps": 40000, "loss": 0.0531, "lr": 9.78940321721966e-07, "epoch": 1.9522390247477586, "percentage": 99.89, "elapsed_time": "1 day, 18:12:43", "remaining_time": "0:02:51", "throughput": 332.9, "total_tokens": 50589088} {"current_steps": 39960, "total_steps": 40000, "loss": 0.0423, "lr": 7.776933122816132e-07, "epoch": 1.952483326411453, "percentage": 99.9, "elapsed_time": "1 day, 18:12:46", "remaining_time": "0:02:32", "throughput": 332.94, "total_tokens": 50595232} {"current_steps": 39965, "total_steps": 40000, "loss": 0.0893, "lr": 5.99578067927986e-07, "epoch": 1.9527276280751473, "percentage": 99.91, "elapsed_time": "1 day, 18:12:49", "remaining_time": "0:02:13", "throughput": 332.97, "total_tokens": 50601728} {"current_steps": 39970, "total_steps": 40000, "loss": 0.0362, "lr": 4.445946161224512e-07, "epoch": 1.9529719297388415, "percentage": 99.92, "elapsed_time": "1 day, 18:12:52", "remaining_time": "0:01:54", "throughput": 333.01, "total_tokens": 50608544} {"current_steps": 39975, "total_steps": 40000, "loss": 0.0555, "lr": 3.127429807792126e-07, "epoch": 1.9532162314025359, "percentage": 99.94, "elapsed_time": "1 day, 18:12:55", "remaining_time": "0:01:35", "throughput": 333.05, "total_tokens": 50615232} {"current_steps": 39980, "total_steps": 40000, "loss": 0.0521, "lr": 2.040231822320049e-07, "epoch": 1.95346053306623, "percentage": 99.95, "elapsed_time": "1 day, 18:12:59", "remaining_time": "0:01:16", "throughput": 333.08, "total_tokens": 50621952} {"current_steps": 39985, "total_steps": 40000, "loss": 0.0542, "lr": 1.1843523723409354e-07, "epoch": 1.9537048347299244, "percentage": 99.96, "elapsed_time": "1 day, 18:13:02", "remaining_time": "0:00:57", "throughput": 333.12, "total_tokens": 50628768} {"current_steps": 39990, "total_steps": 40000, "loss": 0.0338, "lr": 5.597915897492811e-08, "epoch": 1.9539491363936188, "percentage": 99.98, "elapsed_time": "1 day, 18:13:05", "remaining_time": "0:00:38", "throughput": 333.16, "total_tokens": 50635136} {"current_steps": 39995, "total_steps": 40000, "loss": 0.0799, "lr": 1.6654957113448885e-08, "epoch": 1.9541934380573132, "percentage": 99.99, "elapsed_time": "1 day, 18:13:08", "remaining_time": "0:00:19", "throughput": 333.19, "total_tokens": 50641088} {"current_steps": 40000, "total_steps": 40000, "loss": 0.0409, "lr": 4.626377114735902e-10, "epoch": 1.9544377397210075, "percentage": 100.0, "elapsed_time": "1 day, 18:13:11", "remaining_time": "0:00:00", "throughput": 333.22, "total_tokens": 50647232} {"current_steps": 40000, "total_steps": 40000, "eval_loss": 0.06056767329573631, "epoch": 1.9544377397210075, "percentage": 100.0, "elapsed_time": "1 day, 18:23:49", "remaining_time": "0:00:00", "throughput": 331.83, "total_tokens": 50647232} {"current_steps": 40000, "total_steps": 40000, "epoch": 1.9544377397210075, "percentage": 100.0, "elapsed_time": "1 day, 18:23:51", "remaining_time": "0:00:00", "throughput": 331.83, "total_tokens": 50647232}