dclm_baseline_openthoughts1 / trainer_log.jsonl
reinhardh's picture
Training in progress, step 10
5d49675 verified
raw
history blame
9.91 kB
{"current_steps": 1, "total_steps": 7210, "loss": 0.9952, "lr": 1.3869625520110959e-08, "epoch": 0.0006934812760055479, "percentage": 0.01, "elapsed_time": "0:00:18", "remaining_time": "1 day, 13:38:06"}
{"current_steps": 2, "total_steps": 7210, "loss": 1.023, "lr": 2.7739251040221917e-08, "epoch": 0.0013869625520110957, "percentage": 0.03, "elapsed_time": "0:00:20", "remaining_time": "20:34:02"}
{"current_steps": 3, "total_steps": 7210, "loss": 1.0586, "lr": 4.1608876560332874e-08, "epoch": 0.0020804438280166435, "percentage": 0.04, "elapsed_time": "0:00:22", "remaining_time": "14:47:38"}
{"current_steps": 4, "total_steps": 7210, "loss": 1.0157, "lr": 5.5478502080443834e-08, "epoch": 0.0027739251040221915, "percentage": 0.06, "elapsed_time": "0:00:23", "remaining_time": "11:52:52"}
{"current_steps": 5, "total_steps": 7210, "loss": 1.0226, "lr": 6.93481276005548e-08, "epoch": 0.0034674063800277394, "percentage": 0.07, "elapsed_time": "0:00:25", "remaining_time": "10:08:08"}
{"current_steps": 6, "total_steps": 7210, "loss": 1.1396, "lr": 8.321775312066575e-08, "epoch": 0.004160887656033287, "percentage": 0.08, "elapsed_time": "0:00:26", "remaining_time": "8:58:13"}
{"current_steps": 7, "total_steps": 7210, "loss": 1.0319, "lr": 9.70873786407767e-08, "epoch": 0.0048543689320388345, "percentage": 0.1, "elapsed_time": "0:00:28", "remaining_time": "8:08:25"}
{"current_steps": 8, "total_steps": 7210, "loss": 1.0091, "lr": 1.1095700416088767e-07, "epoch": 0.005547850208044383, "percentage": 0.11, "elapsed_time": "0:00:30", "remaining_time": "7:30:51"}
{"current_steps": 9, "total_steps": 7210, "loss": 1.0236, "lr": 1.2482662968099862e-07, "epoch": 0.0062413314840499305, "percentage": 0.12, "elapsed_time": "0:00:31", "remaining_time": "7:01:37"}
{"current_steps": 10, "total_steps": 7210, "loss": 1.0949, "lr": 1.386962552011096e-07, "epoch": 0.006934812760055479, "percentage": 0.14, "elapsed_time": "0:00:33", "remaining_time": "6:38:14"}
{"current_steps": 11, "total_steps": 7210, "loss": 1.0223, "lr": 1.5256588072122053e-07, "epoch": 0.0076282940360610264, "percentage": 0.15, "elapsed_time": "0:03:17", "remaining_time": "1 day, 11:58:25"}
{"current_steps": 12, "total_steps": 7210, "loss": 1.0643, "lr": 1.664355062413315e-07, "epoch": 0.008321775312066574, "percentage": 0.17, "elapsed_time": "0:03:19", "remaining_time": "1 day, 9:15:30"}
{"current_steps": 13, "total_steps": 7210, "loss": 1.0264, "lr": 1.8030513176144244e-07, "epoch": 0.009015256588072122, "percentage": 0.18, "elapsed_time": "0:03:21", "remaining_time": "1 day, 6:56:31"}
{"current_steps": 14, "total_steps": 7210, "loss": 1.084, "lr": 1.941747572815534e-07, "epoch": 0.009708737864077669, "percentage": 0.19, "elapsed_time": "0:03:22", "remaining_time": "1 day, 4:56:46"}
{"current_steps": 15, "total_steps": 7210, "loss": 1.0181, "lr": 2.080443828016644e-07, "epoch": 0.010402219140083218, "percentage": 0.21, "elapsed_time": "0:03:24", "remaining_time": "1 day, 3:13:26"}
{"current_steps": 16, "total_steps": 7210, "loss": 1.0885, "lr": 2.2191400832177534e-07, "epoch": 0.011095700416088766, "percentage": 0.22, "elapsed_time": "0:03:25", "remaining_time": "1 day, 1:42:59"}
{"current_steps": 17, "total_steps": 7210, "loss": 0.9954, "lr": 2.3578363384188628e-07, "epoch": 0.011789181692094313, "percentage": 0.24, "elapsed_time": "0:03:27", "remaining_time": "1 day, 0:23:36"}
{"current_steps": 18, "total_steps": 7210, "loss": 1.011, "lr": 2.4965325936199724e-07, "epoch": 0.012482662968099861, "percentage": 0.25, "elapsed_time": "0:03:29", "remaining_time": "23:15:10"}
{"current_steps": 19, "total_steps": 7210, "loss": 1.0184, "lr": 2.635228848821082e-07, "epoch": 0.013176144244105409, "percentage": 0.26, "elapsed_time": "0:03:31", "remaining_time": "22:11:35"}
{"current_steps": 20, "total_steps": 7210, "loss": 1.1128, "lr": 2.773925104022192e-07, "epoch": 0.013869625520110958, "percentage": 0.28, "elapsed_time": "0:03:32", "remaining_time": "21:14:16"}
{"current_steps": 21, "total_steps": 7210, "loss": 1.0416, "lr": 2.9126213592233014e-07, "epoch": 0.014563106796116505, "percentage": 0.29, "elapsed_time": "0:05:10", "remaining_time": "1 day, 5:30:45"}
{"current_steps": 22, "total_steps": 7210, "loss": 1.0272, "lr": 3.0513176144244106e-07, "epoch": 0.015256588072122053, "percentage": 0.31, "elapsed_time": "0:05:11", "remaining_time": "1 day, 4:18:42"}
{"current_steps": 23, "total_steps": 7210, "loss": 1.0815, "lr": 3.19001386962552e-07, "epoch": 0.0159500693481276, "percentage": 0.32, "elapsed_time": "0:05:13", "remaining_time": "1 day, 3:12:51"}
{"current_steps": 24, "total_steps": 7210, "loss": 1.0639, "lr": 3.32871012482663e-07, "epoch": 0.016643550624133148, "percentage": 0.33, "elapsed_time": "0:05:15", "remaining_time": "1 day, 2:12:37"}
{"current_steps": 25, "total_steps": 7210, "loss": 1.0609, "lr": 3.4674063800277396e-07, "epoch": 0.017337031900138695, "percentage": 0.35, "elapsed_time": "0:05:16", "remaining_time": "1 day, 1:17:05"}
{"current_steps": 26, "total_steps": 7210, "loss": 0.9867, "lr": 3.6061026352288487e-07, "epoch": 0.018030513176144243, "percentage": 0.36, "elapsed_time": "0:05:18", "remaining_time": "1 day, 0:25:47"}
{"current_steps": 27, "total_steps": 7210, "loss": 1.0453, "lr": 3.7447988904299584e-07, "epoch": 0.01872399445214979, "percentage": 0.37, "elapsed_time": "0:05:19", "remaining_time": "23:38:20"}
{"current_steps": 28, "total_steps": 7210, "loss": 1.0749, "lr": 3.883495145631068e-07, "epoch": 0.019417475728155338, "percentage": 0.39, "elapsed_time": "0:05:21", "remaining_time": "22:54:14"}
{"current_steps": 29, "total_steps": 7210, "loss": 1.0681, "lr": 4.022191400832178e-07, "epoch": 0.02011095700416089, "percentage": 0.4, "elapsed_time": "0:05:23", "remaining_time": "22:13:12"}
{"current_steps": 30, "total_steps": 7210, "loss": 0.9954, "lr": 4.160887656033288e-07, "epoch": 0.020804438280166437, "percentage": 0.42, "elapsed_time": "0:05:24", "remaining_time": "21:34:56"}
{"current_steps": 31, "total_steps": 7210, "loss": 0.9347, "lr": 4.299583911234397e-07, "epoch": 0.021497919556171984, "percentage": 0.43, "elapsed_time": "0:06:47", "remaining_time": "1 day, 2:13:29"}
{"current_steps": 32, "total_steps": 7210, "loss": 0.9633, "lr": 4.4382801664355067e-07, "epoch": 0.022191400832177532, "percentage": 0.44, "elapsed_time": "0:06:49", "remaining_time": "1 day, 1:30:00"}
{"current_steps": 33, "total_steps": 7210, "loss": 1.0212, "lr": 4.5769764216366164e-07, "epoch": 0.02288488210818308, "percentage": 0.46, "elapsed_time": "0:06:50", "remaining_time": "1 day, 0:49:11"}
{"current_steps": 34, "total_steps": 7210, "loss": 1.0028, "lr": 4.7156726768377255e-07, "epoch": 0.023578363384188627, "percentage": 0.47, "elapsed_time": "0:06:52", "remaining_time": "1 day, 0:10:45"}
{"current_steps": 35, "total_steps": 7210, "loss": 0.9346, "lr": 4.854368932038835e-07, "epoch": 0.024271844660194174, "percentage": 0.49, "elapsed_time": "0:06:53", "remaining_time": "23:34:29"}
{"current_steps": 36, "total_steps": 7210, "loss": 1.0298, "lr": 4.993065187239945e-07, "epoch": 0.024965325936199722, "percentage": 0.5, "elapsed_time": "0:06:55", "remaining_time": "23:00:21"}
{"current_steps": 37, "total_steps": 7210, "loss": 1.0371, "lr": 5.131761442441055e-07, "epoch": 0.02565880721220527, "percentage": 0.51, "elapsed_time": "0:06:57", "remaining_time": "22:27:57"}
{"current_steps": 38, "total_steps": 7210, "loss": 1.0255, "lr": 5.270457697642164e-07, "epoch": 0.026352288488210817, "percentage": 0.53, "elapsed_time": "0:06:58", "remaining_time": "21:57:12"}
{"current_steps": 39, "total_steps": 7210, "loss": 0.9796, "lr": 5.409153952843274e-07, "epoch": 0.027045769764216365, "percentage": 0.54, "elapsed_time": "0:07:00", "remaining_time": "21:28:08"}
{"current_steps": 40, "total_steps": 7210, "loss": 0.999, "lr": 5.547850208044384e-07, "epoch": 0.027739251040221916, "percentage": 0.55, "elapsed_time": "0:07:01", "remaining_time": "21:00:32"}
{"current_steps": 41, "total_steps": 7210, "loss": 1.0615, "lr": 5.686546463245493e-07, "epoch": 0.028432732316227463, "percentage": 0.57, "elapsed_time": "0:08:30", "remaining_time": "1 day, 0:47:40"}
{"current_steps": 42, "total_steps": 7210, "loss": 0.937, "lr": 5.825242718446603e-07, "epoch": 0.02912621359223301, "percentage": 0.58, "elapsed_time": "0:08:32", "remaining_time": "1 day, 0:16:32"}
{"current_steps": 43, "total_steps": 7210, "loss": 0.9696, "lr": 5.963938973647713e-07, "epoch": 0.029819694868238558, "percentage": 0.6, "elapsed_time": "0:08:33", "remaining_time": "23:46:51"}
{"current_steps": 44, "total_steps": 7210, "loss": 1.0647, "lr": 6.102635228848821e-07, "epoch": 0.030513176144244106, "percentage": 0.61, "elapsed_time": "0:08:35", "remaining_time": "23:18:30"}
{"current_steps": 45, "total_steps": 7210, "loss": 1.0183, "lr": 6.241331484049931e-07, "epoch": 0.031206657420249653, "percentage": 0.62, "elapsed_time": "0:08:36", "remaining_time": "22:51:24"}
{"current_steps": 46, "total_steps": 7210, "loss": 1.0248, "lr": 6.38002773925104e-07, "epoch": 0.0319001386962552, "percentage": 0.64, "elapsed_time": "0:08:38", "remaining_time": "22:25:32"}
{"current_steps": 47, "total_steps": 7210, "loss": 0.9586, "lr": 6.51872399445215e-07, "epoch": 0.03259361997226075, "percentage": 0.65, "elapsed_time": "0:08:39", "remaining_time": "22:00:43"}
{"current_steps": 48, "total_steps": 7210, "loss": 1.0394, "lr": 6.65742024965326e-07, "epoch": 0.033287101248266296, "percentage": 0.67, "elapsed_time": "0:08:41", "remaining_time": "21:36:58"}
{"current_steps": 49, "total_steps": 7210, "loss": 1.0005, "lr": 6.79611650485437e-07, "epoch": 0.03398058252427184, "percentage": 0.68, "elapsed_time": "0:08:43", "remaining_time": "21:14:10"}
{"current_steps": 50, "total_steps": 7210, "loss": 1.0294, "lr": 6.934812760055479e-07, "epoch": 0.03467406380027739, "percentage": 0.69, "elapsed_time": "0:08:44", "remaining_time": "20:52:17"}