{"current_steps": 5, "total_steps": 154, "loss": 4.5691, "lr": 4.991681456235483e-05, "epoch": 0.06493506493506493, "percentage": 3.25, "elapsed_time": "0:00:03", "remaining_time": "0:01:35", "throughput": 62.1, "total_tokens": 200} {"current_steps": 10, "total_steps": 154, "loss": 5.3026, "lr": 4.9579822269987574e-05, "epoch": 0.12987012987012986, "percentage": 6.49, "elapsed_time": "0:00:04", "remaining_time": "0:01:11", "throughput": 75.87, "total_tokens": 376} {"current_steps": 15, "total_steps": 154, "loss": 3.9166, "lr": 4.898732434036244e-05, "epoch": 0.19480519480519481, "percentage": 9.74, "elapsed_time": "0:00:06", "remaining_time": "0:01:01", "throughput": 88.53, "total_tokens": 592} {"current_steps": 20, "total_steps": 154, "loss": 4.0923, "lr": 4.814547975052245e-05, "epoch": 0.2597402597402597, "percentage": 12.99, "elapsed_time": "0:00:08", "remaining_time": "0:00:56", "throughput": 95.14, "total_tokens": 800} {"current_steps": 25, "total_steps": 154, "loss": 3.5885, "lr": 4.7063039419658035e-05, "epoch": 0.3246753246753247, "percentage": 16.23, "elapsed_time": "0:00:10", "remaining_time": "0:00:52", "throughput": 97.7, "total_tokens": 992} {"current_steps": 30, "total_steps": 154, "loss": 2.6237, "lr": 4.5751255243877015e-05, "epoch": 0.38961038961038963, "percentage": 19.48, "elapsed_time": "0:00:11", "remaining_time": "0:00:49", "throughput": 97.48, "total_tokens": 1160} {"current_steps": 35, "total_steps": 154, "loss": 2.1141, "lr": 4.422376313348405e-05, "epoch": 0.45454545454545453, "percentage": 22.73, "elapsed_time": "0:00:13", "remaining_time": "0:00:46", "throughput": 101.49, "total_tokens": 1384} {"current_steps": 40, "total_steps": 154, "loss": 1.6475, "lr": 4.2496441268589046e-05, "epoch": 0.5194805194805194, "percentage": 25.97, "elapsed_time": "0:00:15", "remaining_time": "0:00:43", "throughput": 103.08, "total_tokens": 1584} {"current_steps": 45, "total_steps": 154, "loss": 2.3441, "lr": 4.058724504646834e-05, "epoch": 0.5844155844155844, "percentage": 29.22, "elapsed_time": "0:00:17", "remaining_time": "0:00:41", "throughput": 104.38, "total_tokens": 1784} {"current_steps": 50, "total_steps": 154, "loss": 1.6557, "lr": 3.851602043638994e-05, "epoch": 0.6493506493506493, "percentage": 32.47, "elapsed_time": "0:00:18", "remaining_time": "0:00:39", "throughput": 106.73, "total_tokens": 2008} {"current_steps": 55, "total_steps": 154, "loss": 1.4454, "lr": 3.6304297682067144e-05, "epoch": 0.7142857142857143, "percentage": 35.71, "elapsed_time": "0:00:20", "remaining_time": "0:00:36", "throughput": 107.12, "total_tokens": 2200} {"current_steps": 60, "total_steps": 154, "loss": 1.6826, "lr": 3.3975067496189965e-05, "epoch": 0.7792207792207793, "percentage": 38.96, "elapsed_time": "0:00:22", "remaining_time": "0:00:34", "throughput": 109.86, "total_tokens": 2448} {"current_steps": 65, "total_steps": 154, "loss": 1.4454, "lr": 3.1552542073477555e-05, "epoch": 0.8441558441558441, "percentage": 42.21, "elapsed_time": "0:00:24", "remaining_time": "0:00:32", "throughput": 110.47, "total_tokens": 2656} {"current_steps": 70, "total_steps": 154, "loss": 1.4228, "lr": 2.9061903406505154e-05, "epoch": 0.9090909090909091, "percentage": 45.45, "elapsed_time": "0:00:25", "remaining_time": "0:00:30", "throughput": 111.97, "total_tokens": 2888} {"current_steps": 75, "total_steps": 154, "loss": 1.3693, "lr": 2.652904152054607e-05, "epoch": 0.974025974025974, "percentage": 48.7, "elapsed_time": "0:00:27", "remaining_time": "0:00:28", "throughput": 111.97, "total_tokens": 3080} {"current_steps": 80, "total_steps": 154, "loss": 1.9372, "lr": 2.3980285348460363e-05, "epoch": 1.0389610389610389, "percentage": 51.95, "elapsed_time": "0:00:29", "remaining_time": "0:00:27", "throughput": 111.97, "total_tokens": 3272} {"current_steps": 85, "total_steps": 154, "loss": 1.0038, "lr": 2.1442129043167874e-05, "epoch": 1.103896103896104, "percentage": 55.19, "elapsed_time": "0:00:30", "remaining_time": "0:00:25", "throughput": 111.68, "total_tokens": 3456} {"current_steps": 90, "total_steps": 154, "loss": 1.0141, "lr": 1.8940956572669692e-05, "epoch": 1.1688311688311688, "percentage": 58.44, "elapsed_time": "0:00:32", "remaining_time": "0:00:23", "throughput": 111.68, "total_tokens": 3648} {"current_steps": 95, "total_steps": 154, "loss": 0.9873, "lr": 1.6502767460434588e-05, "epoch": 1.2337662337662338, "percentage": 61.69, "elapsed_time": "0:00:34", "remaining_time": "0:00:21", "throughput": 112.14, "total_tokens": 3856} {"current_steps": 100, "total_steps": 154, "loss": 1.4175, "lr": 1.4152906522061048e-05, "epoch": 1.2987012987012987, "percentage": 64.94, "elapsed_time": "0:00:36", "remaining_time": "0:00:19", "throughput": 114.73, "total_tokens": 4144} {"current_steps": 100, "total_steps": 154, "eval_loss": 1.2581640481948853, "epoch": 1.2987012987012987, "percentage": 64.94, "elapsed_time": "0:00:37", "remaining_time": "0:00:20", "throughput": 111.23, "total_tokens": 4144} {"current_steps": 105, "total_steps": 154, "loss": 1.7128, "lr": 1.1915800407584704e-05, "epoch": 1.3636363636363638, "percentage": 68.18, "elapsed_time": "0:00:40", "remaining_time": "0:00:18", "throughput": 109.02, "total_tokens": 4368} {"current_steps": 110, "total_steps": 154, "loss": 0.8593, "lr": 9.814703688056321e-06, "epoch": 1.4285714285714286, "percentage": 71.43, "elapsed_time": "0:00:41", "remaining_time": "0:00:16", "throughput": 109.1, "total_tokens": 4560} {"current_steps": 115, "total_steps": 154, "loss": 1.2189, "lr": 7.871457125803896e-06, "epoch": 1.4935064935064934, "percentage": 74.68, "elapsed_time": "0:00:43", "remaining_time": "0:00:14", "throughput": 108.77, "total_tokens": 4736} {"current_steps": 120, "total_steps": 154, "loss": 1.0924, "lr": 6.106260641143546e-06, "epoch": 1.5584415584415585, "percentage": 77.92, "elapsed_time": "0:00:45", "remaining_time": "0:00:12", "throughput": 108.35, "total_tokens": 4928} {"current_steps": 125, "total_steps": 154, "loss": 1.422, "lr": 4.537463335535161e-06, "epoch": 1.6233766233766234, "percentage": 81.17, "elapsed_time": "0:00:47", "remaining_time": "0:00:10", "throughput": 108.96, "total_tokens": 5152} {"current_steps": 130, "total_steps": 154, "loss": 1.0191, "lr": 3.181372753878595e-06, "epoch": 1.6883116883116882, "percentage": 84.42, "elapsed_time": "0:00:49", "remaining_time": "0:00:09", "throughput": 109.35, "total_tokens": 5360} {"current_steps": 135, "total_steps": 154, "loss": 1.0357, "lr": 2.0520853686560178e-06, "epoch": 1.7532467532467533, "percentage": 87.66, "elapsed_time": "0:00:50", "remaining_time": "0:00:07", "throughput": 109.57, "total_tokens": 5560} {"current_steps": 140, "total_steps": 154, "loss": 0.9097, "lr": 1.1613400480268099e-06, "epoch": 1.8181818181818183, "percentage": 90.91, "elapsed_time": "0:00:52", "remaining_time": "0:00:05", "throughput": 109.2, "total_tokens": 5728} {"current_steps": 145, "total_steps": 154, "loss": 0.8963, "lr": 5.183960310644748e-07, "epoch": 1.883116883116883, "percentage": 94.16, "elapsed_time": "0:00:54", "remaining_time": "0:00:03", "throughput": 109.45, "total_tokens": 5928} {"current_steps": 150, "total_steps": 154, "loss": 1.2464, "lr": 1.29936678574899e-07, "epoch": 1.948051948051948, "percentage": 97.4, "elapsed_time": "0:00:55", "remaining_time": "0:00:01", "throughput": 109.81, "total_tokens": 6136} {"current_steps": 154, "total_steps": 154, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:00:58", "remaining_time": "0:00:00", "throughput": 107.9, "total_tokens": 6288}