|
{"current_steps": 100, "total_steps": 4920, "loss": 1.0073, "learning_rate": 1.0162601626016261e-06, "epoch": 0.16260162601626016, "percentage": 2.03, "elapsed_time": "0:20:42", "remaining_time": "16:37:49", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 200, "total_steps": 4920, "loss": 0.0302, "learning_rate": 2.0325203252032523e-06, "epoch": 0.3252032520325203, "percentage": 4.07, "elapsed_time": "0:41:21", "remaining_time": "16:15:54", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 300, "total_steps": 4920, "loss": 0.0229, "learning_rate": 3.0487804878048782e-06, "epoch": 0.4878048780487805, "percentage": 6.1, "elapsed_time": "1:01:57", "remaining_time": "15:54:16", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 400, "total_steps": 4920, "loss": 0.0197, "learning_rate": 4.0650406504065046e-06, "epoch": 0.6504065040650406, "percentage": 8.13, "elapsed_time": "1:22:30", "remaining_time": "15:32:18", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 500, "total_steps": 4920, "loss": 0.0183, "learning_rate": 4.999959730768458e-06, "epoch": 0.8130081300813008, "percentage": 10.16, "elapsed_time": "1:43:03", "remaining_time": "15:11:00", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 600, "total_steps": 4920, "loss": 0.0172, "learning_rate": 4.992664502959351e-06, "epoch": 0.975609756097561, "percentage": 12.2, "elapsed_time": "2:03:39", "remaining_time": "14:50:19", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 700, "total_steps": 4920, "loss": 0.0149, "learning_rate": 4.9728272933003704e-06, "epoch": 1.1382113821138211, "percentage": 14.23, "elapsed_time": "2:24:13", "remaining_time": "14:29:30", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 800, "total_steps": 4920, "loss": 0.015, "learning_rate": 4.940547913829274e-06, "epoch": 1.3008130081300813, "percentage": 16.26, "elapsed_time": "2:44:42", "remaining_time": "14:08:14", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 900, "total_steps": 4920, "loss": 0.0147, "learning_rate": 4.89598878006206e-06, "epoch": 1.4634146341463414, "percentage": 18.29, "elapsed_time": "3:05:11", "remaining_time": "13:47:10", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1000, "total_steps": 4920, "loss": 0.0144, "learning_rate": 4.839374093790139e-06, "epoch": 1.6260162601626016, "percentage": 20.33, "elapsed_time": "3:25:40", "remaining_time": "13:26:13", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1000, "total_steps": 4920, "eval_loss": 0.014762421138584614, "epoch": 1.6260162601626016, "percentage": 20.33, "elapsed_time": "3:29:32", "remaining_time": "13:41:25", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1100, "total_steps": 4920, "loss": 0.0135, "learning_rate": 4.770988714996401e-06, "epoch": 1.7886178861788617, "percentage": 22.36, "elapsed_time": "3:51:25", "remaining_time": "13:23:39", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1200, "total_steps": 4920, "loss": 0.0138, "learning_rate": 4.691176728566159e-06, "epoch": 1.951219512195122, "percentage": 24.39, "elapsed_time": "4:11:57", "remaining_time": "13:01:02", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1300, "total_steps": 4920, "loss": 0.0109, "learning_rate": 4.600339713004673e-06, "epoch": 2.113821138211382, "percentage": 26.42, "elapsed_time": "4:32:29", "remaining_time": "12:38:48", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1400, "total_steps": 4920, "loss": 0.011, "learning_rate": 4.498934719872278e-06, "epoch": 2.2764227642276422, "percentage": 28.46, "elapsed_time": "4:52:59", "remaining_time": "12:16:39", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1500, "total_steps": 4920, "loss": 0.0109, "learning_rate": 4.387471974103713e-06, "epoch": 2.4390243902439024, "percentage": 30.49, "elapsed_time": "5:13:30", "remaining_time": "11:54:48", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1600, "total_steps": 4920, "loss": 0.0113, "learning_rate": 4.266512306782628e-06, "epoch": 2.6016260162601625, "percentage": 32.52, "elapsed_time": "5:34:02", "remaining_time": "11:33:08", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1700, "total_steps": 4920, "loss": 0.0111, "learning_rate": 4.136664333288392e-06, "epoch": 2.7642276422764227, "percentage": 34.55, "elapsed_time": "5:54:33", "remaining_time": "11:11:34", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1800, "total_steps": 4920, "loss": 0.0104, "learning_rate": 3.998581391013531e-06, "epoch": 2.926829268292683, "percentage": 36.59, "elapsed_time": "6:15:06", "remaining_time": "10:50:10", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 1900, "total_steps": 4920, "loss": 0.0082, "learning_rate": 3.8529582520598395e-06, "epoch": 3.089430894308943, "percentage": 38.62, "elapsed_time": "6:35:39", "remaining_time": "10:28:52", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2000, "total_steps": 4920, "loss": 0.0068, "learning_rate": 3.7005276274534145e-06, "epoch": 3.252032520325203, "percentage": 40.65, "elapsed_time": "6:56:09", "remaining_time": "10:07:35", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2000, "total_steps": 4920, "eval_loss": 0.01827162876725197, "epoch": 3.252032520325203, "percentage": 40.65, "elapsed_time": "6:59:53", "remaining_time": "10:13:02", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2100, "total_steps": 4920, "loss": 0.0077, "learning_rate": 3.5420564804678583e-06, "epoch": 3.4146341463414633, "percentage": 42.68, "elapsed_time": "7:21:29", "remaining_time": "9:52:51", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2200, "total_steps": 4920, "loss": 0.0073, "learning_rate": 3.378342167605362e-06, "epoch": 3.5772357723577235, "percentage": 44.72, "elapsed_time": "7:42:02", "remaining_time": "9:31:15", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2300, "total_steps": 4920, "loss": 0.0074, "learning_rate": 3.21020842665256e-06, "epoch": 3.7398373983739837, "percentage": 46.75, "elapsed_time": "8:02:34", "remaining_time": "9:09:43", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2400, "total_steps": 4920, "loss": 0.0069, "learning_rate": 3.038501231997454e-06, "epoch": 3.902439024390244, "percentage": 48.78, "elapsed_time": "8:23:03", "remaining_time": "8:48:13", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2500, "total_steps": 4920, "loss": 0.0052, "learning_rate": 2.8640845380616257e-06, "epoch": 4.065040650406504, "percentage": 50.81, "elapsed_time": "8:43:36", "remaining_time": "8:26:50", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2600, "total_steps": 4920, "loss": 0.0029, "learning_rate": 2.6878359322649085e-06, "epoch": 4.227642276422764, "percentage": 52.85, "elapsed_time": "9:04:07", "remaining_time": "8:05:31", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2700, "total_steps": 4920, "loss": 0.0034, "learning_rate": 2.510642219394847e-06, "epoch": 4.390243902439025, "percentage": 54.88, "elapsed_time": "9:24:38", "remaining_time": "7:44:15", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2800, "total_steps": 4920, "loss": 0.0032, "learning_rate": 2.3333949595984614e-06, "epoch": 4.5528455284552845, "percentage": 56.91, "elapsed_time": "9:45:11", "remaining_time": "7:23:04", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 2900, "total_steps": 4920, "loss": 0.0033, "learning_rate": 2.1569859824471445e-06, "epoch": 4.715447154471545, "percentage": 58.94, "elapsed_time": "10:05:41", "remaining_time": "7:01:53", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3000, "total_steps": 4920, "loss": 0.003, "learning_rate": 1.9823028996459487e-06, "epoch": 4.878048780487805, "percentage": 60.98, "elapsed_time": "10:26:11", "remaining_time": "6:40:45", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3000, "total_steps": 4920, "eval_loss": 0.02072063274681568, "epoch": 4.878048780487805, "percentage": 60.98, "elapsed_time": "10:29:55", "remaining_time": "6:43:08", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3100, "total_steps": 4920, "loss": 0.0021, "learning_rate": 1.8102246389652839e-06, "epoch": 5.040650406504065, "percentage": 63.01, "elapsed_time": "10:52:57", "remaining_time": "6:23:20", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3200, "total_steps": 4920, "loss": 0.0007, "learning_rate": 1.6416170218663446e-06, "epoch": 5.203252032520325, "percentage": 65.04, "elapsed_time": "11:13:30", "remaining_time": "6:02:00", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3300, "total_steps": 4920, "loss": 0.0008, "learning_rate": 1.4773284070716504e-06, "epoch": 5.365853658536586, "percentage": 67.07, "elapsed_time": "11:33:59", "remaining_time": "5:40:40", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3400, "total_steps": 4920, "loss": 0.0007, "learning_rate": 1.3181854220003568e-06, "epoch": 5.528455284552845, "percentage": 69.11, "elapsed_time": "11:54:27", "remaining_time": "5:19:24", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3500, "total_steps": 4920, "loss": 0.0007, "learning_rate": 1.164988803545826e-06, "epoch": 5.691056910569106, "percentage": 71.14, "elapsed_time": "12:14:59", "remaining_time": "4:58:11", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3600, "total_steps": 4920, "loss": 0.0008, "learning_rate": 1.0185093691228535e-06, "epoch": 5.853658536585366, "percentage": 73.17, "elapsed_time": "12:35:34", "remaining_time": "4:37:02", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3700, "total_steps": 4920, "loss": 0.0006, "learning_rate": 8.794841382564212e-07, "epoch": 6.016260162601626, "percentage": 75.2, "elapsed_time": "12:56:06", "remaining_time": "4:15:54", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3800, "total_steps": 4920, "loss": 0.0001, "learning_rate": 7.486126242264469e-07, "epoch": 6.178861788617886, "percentage": 77.24, "elapsed_time": "13:16:36", "remaining_time": "3:54:47", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 3900, "total_steps": 4920, "loss": 0.0001, "learning_rate": 6.265533144273175e-07, "epoch": 6.341463414634147, "percentage": 79.27, "elapsed_time": "13:37:08", "remaining_time": "3:33:42", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4000, "total_steps": 4920, "loss": 0.0001, "learning_rate": 5.139203571514673e-07, "epoch": 6.504065040650406, "percentage": 81.3, "elapsed_time": "13:57:41", "remaining_time": "3:12:40", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4000, "total_steps": 4920, "eval_loss": 0.03588717430830002, "epoch": 6.504065040650406, "percentage": 81.3, "elapsed_time": "14:01:26", "remaining_time": "3:13:31", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4100, "total_steps": 4920, "loss": 0.0001, "learning_rate": 4.1128047146765936e-07, "epoch": 6.666666666666667, "percentage": 83.33, "elapsed_time": "14:24:11", "remaining_time": "2:52:50", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4200, "total_steps": 4920, "loss": 0.0001, "learning_rate": 3.191500957420626e-07, "epoch": 6.829268292682927, "percentage": 85.37, "elapsed_time": "14:44:46", "remaining_time": "2:31:40", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4300, "total_steps": 4920, "loss": 0.0001, "learning_rate": 2.3799278914952957e-07, "epoch": 6.991869918699187, "percentage": 87.4, "elapsed_time": "15:05:19", "remaining_time": "2:10:32", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4400, "total_steps": 4920, "loss": 0.0, "learning_rate": 1.682168992494923e-07, "epoch": 7.154471544715447, "percentage": 89.43, "elapsed_time": "15:25:53", "remaining_time": "1:49:25", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4500, "total_steps": 4920, "loss": 0.0, "learning_rate": 1.1017350736221927e-07, "epoch": 7.317073170731708, "percentage": 91.46, "elapsed_time": "15:46:25", "remaining_time": "1:28:20", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4600, "total_steps": 4920, "loss": 0.0, "learning_rate": 6.415466208337662e-08, "epoch": 7.479674796747967, "percentage": 93.5, "elapsed_time": "16:06:59", "remaining_time": "1:07:16", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4700, "total_steps": 4920, "loss": 0.0, "learning_rate": 3.039190982506823e-08, "epoch": 7.642276422764228, "percentage": 95.53, "elapsed_time": "16:27:32", "remaining_time": "0:46:13", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4800, "total_steps": 4920, "loss": 0.0, "learning_rate": 9.055129777021664e-09, "epoch": 7.804878048780488, "percentage": 97.56, "elapsed_time": "16:48:04", "remaining_time": "0:25:12", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4900, "total_steps": 4920, "loss": 0.0, "learning_rate": 2.5167914987633825e-10, "epoch": 7.967479674796748, "percentage": 99.59, "elapsed_time": "17:08:36", "remaining_time": "0:04:11", "throughput": "0.00", "total_tokens": 0} |
|
{"current_steps": 4920, "total_steps": 4920, "epoch": 8.0, "percentage": 100.0, "elapsed_time": "17:14:54", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} |
|
|