|
{ |
|
"best_global_step": 471, |
|
"best_metric": 0.7473118279569892, |
|
"best_model_checkpoint": "/linkhome/rech/genini01/udd26kf/scratch/weborganizer/models/runs/answerdotai--ModernBERT-base_TopicAnnotations-Llama-3.1-8B_bsz512_lr1e-4_epochs5_warmup0.1_url1_TopicAnnotations-Llama-3.1-405B-FP8_bsz512_lr1e-4_epochs5_warmup0.1_url1/checkpoint-471", |
|
"epoch": 4.9728, |
|
"eval_steps": 500, |
|
"global_step": 780, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.64, |
|
"grad_norm": 8.25, |
|
"learning_rate": 9.686609686609687e-05, |
|
"loss": 2.1544, |
|
"num_input_tokens_seen": 249204064, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_validation.parquet_accuracy": 0.8451, |
|
"eval_validation.parquet_accuracy__0": 0.9019607843137255, |
|
"eval_validation.parquet_accuracy__1": 0.7975460122699386, |
|
"eval_validation.parquet_accuracy__10": 0.9105882352941177, |
|
"eval_validation.parquet_accuracy__11": 0.8687258687258688, |
|
"eval_validation.parquet_accuracy__12": 0.8734622144112478, |
|
"eval_validation.parquet_accuracy__13": 0.6827956989247311, |
|
"eval_validation.parquet_accuracy__14": 0.8229461756373938, |
|
"eval_validation.parquet_accuracy__15": 0.8427947598253275, |
|
"eval_validation.parquet_accuracy__16": 0.8194842406876791, |
|
"eval_validation.parquet_accuracy__17": 0.8260135135135135, |
|
"eval_validation.parquet_accuracy__18": 0.8732876712328768, |
|
"eval_validation.parquet_accuracy__19": 0.861764705882353, |
|
"eval_validation.parquet_accuracy__2": 0.8159203980099502, |
|
"eval_validation.parquet_accuracy__20": 0.7183098591549296, |
|
"eval_validation.parquet_accuracy__21": 0.8975409836065574, |
|
"eval_validation.parquet_accuracy__22": 0.7981651376146789, |
|
"eval_validation.parquet_accuracy__23": 0.863481228668942, |
|
"eval_validation.parquet_accuracy__3": 0.9017857142857143, |
|
"eval_validation.parquet_accuracy__4": 0.8697829716193656, |
|
"eval_validation.parquet_accuracy__5": 0.8246268656716418, |
|
"eval_validation.parquet_accuracy__6": 0.8907168037602821, |
|
"eval_validation.parquet_accuracy__7": 0.7784946236559139, |
|
"eval_validation.parquet_accuracy__8": 0.8932584269662921, |
|
"eval_validation.parquet_accuracy__9": 0.8230403800475059, |
|
"eval_validation.parquet_accuracy_conf50": 0.8559460563955864, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.9108910891089109, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.8087774294670846, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9148936170212766, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.8745098039215686, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.8857142857142857, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7085714285714285, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.8338150289017341, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8609865470852018, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8240469208211144, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8319039451114922, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8788927335640139, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.8761329305135952, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8350515463917526, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.7323529411764705, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.9009628610729024, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8113207547169812, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.865979381443299, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.9195046439628483, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.8807495741056218, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8358778625954199, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.9020310633213859, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.7986425339366516, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.8951841359773371, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.8345498783454988, |
|
"eval_validation.parquet_accuracy_conf75": 0.9065606361829026, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.967391304347826, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.8828125, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9493670886075949, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9037656903765691, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9176470588235294, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.7906976744186046, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.9027303754266212, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9281767955801105, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.886986301369863, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.8814229249011858, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9176029962546817, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.9185185185185185, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.9047619047619048, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8022813688212928, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9327485380116959, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.8741007194244604, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9246031746031746, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9473684210526315, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.9242718446601942, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.8879310344827587, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9322033898305084, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.848, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.9339622641509434, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.9001447178002895, |
|
"eval_validation.parquet_accuracy_label_average": 0.8398538864075228, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8508892890353281, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.9024790252593734, |
|
"eval_validation.parquet_accuracy_label_min": 0.6827956989247311, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7085714285714285, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.7906976744186046, |
|
"eval_validation.parquet_loss": 0.5004527568817139, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 10.52, |
|
"eval_validation.parquet_samples_per_second": 950.571, |
|
"eval_validation.parquet_steps_per_second": 29.753, |
|
"num_input_tokens_seen": 390215936, |
|
"step": 157 |
|
}, |
|
{ |
|
"epoch": 1.2752, |
|
"grad_norm": 9.875, |
|
"learning_rate": 8.262108262108262e-05, |
|
"loss": 1.8475, |
|
"num_input_tokens_seen": 499147424, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.9152, |
|
"grad_norm": 7.53125, |
|
"learning_rate": 6.837606837606838e-05, |
|
"loss": 1.7317, |
|
"num_input_tokens_seen": 751160992, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_validation.parquet_accuracy": 0.8526, |
|
"eval_validation.parquet_accuracy__0": 0.8725490196078431, |
|
"eval_validation.parquet_accuracy__1": 0.8128834355828221, |
|
"eval_validation.parquet_accuracy__10": 0.9176470588235294, |
|
"eval_validation.parquet_accuracy__11": 0.9073359073359073, |
|
"eval_validation.parquet_accuracy__12": 0.9138840070298769, |
|
"eval_validation.parquet_accuracy__13": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy__14": 0.7818696883852692, |
|
"eval_validation.parquet_accuracy__15": 0.8427947598253275, |
|
"eval_validation.parquet_accuracy__16": 0.8481375358166189, |
|
"eval_validation.parquet_accuracy__17": 0.8733108108108109, |
|
"eval_validation.parquet_accuracy__18": 0.8732876712328768, |
|
"eval_validation.parquet_accuracy__19": 0.8205882352941176, |
|
"eval_validation.parquet_accuracy__2": 0.7860696517412935, |
|
"eval_validation.parquet_accuracy__20": 0.7830985915492957, |
|
"eval_validation.parquet_accuracy__21": 0.9344262295081968, |
|
"eval_validation.parquet_accuracy__22": 0.8562691131498471, |
|
"eval_validation.parquet_accuracy__23": 0.9078498293515358, |
|
"eval_validation.parquet_accuracy__3": 0.8541666666666666, |
|
"eval_validation.parquet_accuracy__4": 0.8414023372287145, |
|
"eval_validation.parquet_accuracy__5": 0.8208955223880597, |
|
"eval_validation.parquet_accuracy__6": 0.8883666274970623, |
|
"eval_validation.parquet_accuracy__7": 0.7784946236559139, |
|
"eval_validation.parquet_accuracy__8": 0.8960674157303371, |
|
"eval_validation.parquet_accuracy__9": 0.8111638954869359, |
|
"eval_validation.parquet_accuracy_conf50": 0.8627911728647323, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.8811881188118812, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.8244514106583072, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9219858156028369, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.9137254901960784, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.9214285714285714, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7771428571428571, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.7947976878612717, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8565022421524664, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8533724340175953, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8782161234991424, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8788927335640139, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.8368580060422961, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8041237113402062, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.8, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.936726272352132, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8679245283018868, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.9072164948453608, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.8761609907120743, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.8534923339011925, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8320610687022901, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.8984468339307049, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.7873303167420814, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.8980169971671388, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.8211678832116789, |
|
"eval_validation.parquet_accuracy_conf75": 0.9124079055081277, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.9347826086956522, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.8984375, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9620253164556962, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9372384937238494, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9529411764705882, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.8294573643410853, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.8686006825938567, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9226519337016574, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.9143835616438356, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.9209486166007905, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9250936329588015, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.8962962962962963, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.8809523809523809, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8593155893536122, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9576023391812866, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.8992805755395683, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9603174603174603, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9192982456140351, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.8990291262135922, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.8879310344827587, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9282920469361148, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.84, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.9339622641509434, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.8900144717800289, |
|
"eval_validation.parquet_accuracy_label_average": 0.8485205882320762, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8592178717576693, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.909118863250162, |
|
"eval_validation.parquet_accuracy_label_min": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7771428571428571, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.8294573643410853, |
|
"eval_validation.parquet_loss": 0.4816047251224518, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 8.307, |
|
"eval_validation.parquet_samples_per_second": 1203.799, |
|
"eval_validation.parquet_steps_per_second": 37.679, |
|
"num_input_tokens_seen": 783399104, |
|
"step": 314 |
|
}, |
|
{ |
|
"epoch": 2.5504, |
|
"grad_norm": 7.59375, |
|
"learning_rate": 5.413105413105414e-05, |
|
"loss": 1.5837, |
|
"num_input_tokens_seen": 999700736, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_validation.parquet_accuracy": 0.8558, |
|
"eval_validation.parquet_accuracy__0": 0.8627450980392157, |
|
"eval_validation.parquet_accuracy__1": 0.7607361963190185, |
|
"eval_validation.parquet_accuracy__10": 0.9035294117647059, |
|
"eval_validation.parquet_accuracy__11": 0.8764478764478765, |
|
"eval_validation.parquet_accuracy__12": 0.8980667838312829, |
|
"eval_validation.parquet_accuracy__13": 0.7473118279569892, |
|
"eval_validation.parquet_accuracy__14": 0.839943342776204, |
|
"eval_validation.parquet_accuracy__15": 0.8427947598253275, |
|
"eval_validation.parquet_accuracy__16": 0.830945558739255, |
|
"eval_validation.parquet_accuracy__17": 0.839527027027027, |
|
"eval_validation.parquet_accuracy__18": 0.8801369863013698, |
|
"eval_validation.parquet_accuracy__19": 0.8117647058823529, |
|
"eval_validation.parquet_accuracy__2": 0.7860696517412935, |
|
"eval_validation.parquet_accuracy__20": 0.7633802816901408, |
|
"eval_validation.parquet_accuracy__21": 0.9289617486338798, |
|
"eval_validation.parquet_accuracy__22": 0.8562691131498471, |
|
"eval_validation.parquet_accuracy__23": 0.8805460750853242, |
|
"eval_validation.parquet_accuracy__3": 0.8660714285714286, |
|
"eval_validation.parquet_accuracy__4": 0.8530884808013356, |
|
"eval_validation.parquet_accuracy__5": 0.8694029850746269, |
|
"eval_validation.parquet_accuracy__6": 0.900117508813161, |
|
"eval_validation.parquet_accuracy__7": 0.7741935483870968, |
|
"eval_validation.parquet_accuracy__8": 0.8904494382022472, |
|
"eval_validation.parquet_accuracy__9": 0.8669833729216152, |
|
"eval_validation.parquet_accuracy_conf50": 0.8663669799754802, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.8712871287128713, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.7711598746081505, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9078014184397163, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.8823529411764706, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.9089285714285714, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7828571428571428, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.8511560693641619, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8565022421524664, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8357771260997068, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8456260720411664, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8858131487889274, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.8277945619335347, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8041237113402062, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.7794117647058824, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.9312242090784044, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8710691823899371, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.8797250859106529, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.8885448916408669, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.8637137989778535, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8816793893129771, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.9115890083632019, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.7850678733031674, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.8923512747875354, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.878345498783455, |
|
"eval_validation.parquet_accuracy_conf75": 0.9145129224652088, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.9239130434782609, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.85546875, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9493670886075949, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9121338912133892, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9450980392156862, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.8294573643410853, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.9129692832764505, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9392265193370166, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.8972602739726028, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.8893280632411067, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9288389513108615, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.8925925925925926, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.8809523809523809, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8479087452471483, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9502923976608187, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.9064748201438849, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9404761904761905, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9228070175438596, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.9067961165048544, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.9224137931034483, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9374185136897001, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.8453333333333334, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.9276729559748428, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.9305354558610709, |
|
"eval_validation.parquet_accuracy_label_average": 0.8470618003326092, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8580792494248763, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.9081139825449239, |
|
"eval_validation.parquet_accuracy_label_min": 0.7473118279569892, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7711598746081505, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.8294573643410853, |
|
"eval_validation.parquet_loss": 0.4807276427745819, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 8.2886, |
|
"eval_validation.parquet_samples_per_second": 1206.475, |
|
"eval_validation.parquet_steps_per_second": 37.763, |
|
"num_input_tokens_seen": 1176307328, |
|
"step": 471 |
|
}, |
|
{ |
|
"epoch": 3.1856, |
|
"grad_norm": 6.53125, |
|
"learning_rate": 3.988603988603989e-05, |
|
"loss": 1.5392, |
|
"num_input_tokens_seen": 1250925472, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.8256, |
|
"grad_norm": 7.0625, |
|
"learning_rate": 2.564102564102564e-05, |
|
"loss": 1.4928, |
|
"num_input_tokens_seen": 1499507040, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_validation.parquet_accuracy": 0.8567, |
|
"eval_validation.parquet_accuracy__0": 0.8725490196078431, |
|
"eval_validation.parquet_accuracy__1": 0.8006134969325154, |
|
"eval_validation.parquet_accuracy__10": 0.9105882352941177, |
|
"eval_validation.parquet_accuracy__11": 0.888030888030888, |
|
"eval_validation.parquet_accuracy__12": 0.9086115992970123, |
|
"eval_validation.parquet_accuracy__13": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy__14": 0.8271954674220963, |
|
"eval_validation.parquet_accuracy__15": 0.851528384279476, |
|
"eval_validation.parquet_accuracy__16": 0.8510028653295129, |
|
"eval_validation.parquet_accuracy__17": 0.8817567567567568, |
|
"eval_validation.parquet_accuracy__18": 0.8664383561643836, |
|
"eval_validation.parquet_accuracy__19": 0.8088235294117647, |
|
"eval_validation.parquet_accuracy__2": 0.8059701492537313, |
|
"eval_validation.parquet_accuracy__20": 0.7492957746478873, |
|
"eval_validation.parquet_accuracy__21": 0.924863387978142, |
|
"eval_validation.parquet_accuracy__22": 0.8379204892966361, |
|
"eval_validation.parquet_accuracy__23": 0.863481228668942, |
|
"eval_validation.parquet_accuracy__3": 0.8779761904761905, |
|
"eval_validation.parquet_accuracy__4": 0.8464106844741235, |
|
"eval_validation.parquet_accuracy__5": 0.8731343283582089, |
|
"eval_validation.parquet_accuracy__6": 0.881316098707403, |
|
"eval_validation.parquet_accuracy__7": 0.810752688172043, |
|
"eval_validation.parquet_accuracy__8": 0.8904494382022472, |
|
"eval_validation.parquet_accuracy__9": 0.8396674584323041, |
|
"eval_validation.parquet_accuracy_conf50": 0.8674908050674295, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.8811881188118812, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.8119122257053292, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9148936170212766, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.8980392156862745, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.9178571428571428, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7771428571428571, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.838150289017341, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8654708520179372, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8563049853372434, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8867924528301887, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8719723183391004, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.824773413897281, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8247422680412371, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.7676470588235295, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.9270976616231087, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8522012578616353, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.8625429553264605, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.9009287925696594, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.858603066439523, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8854961832061069, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.8936678614097969, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.8235294117647058, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.8923512747875354, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.8503649635036497, |
|
"eval_validation.parquet_accuracy_conf75": 0.9156823763302537, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.9347826086956522, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.88671875, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9544303797468354, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9288702928870293, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9509803921568627, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.8217054263565892, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.9027303754266212, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9392265193370166, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.910958904109589, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.9308300395256917, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9138576779026217, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.8851851851851852, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.9047619047619048, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8365019011406845, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9488304093567251, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.89568345323741, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9365079365079365, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9333333333333333, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.8932038834951457, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.9224137931034483, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9230769230769231, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.8746666666666667, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.9339622641509434, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.91027496382055, |
|
"eval_validation.parquet_accuracy_label_average": 0.8504296666277162, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8618195935008668, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.9113955826658905, |
|
"eval_validation.parquet_accuracy_label_min": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7676470588235295, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.8217054263565892, |
|
"eval_validation.parquet_loss": 0.47853514552116394, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 8.3896, |
|
"eval_validation.parquet_samples_per_second": 1191.949, |
|
"eval_validation.parquet_steps_per_second": 37.308, |
|
"num_input_tokens_seen": 1566401088, |
|
"step": 628 |
|
}, |
|
{ |
|
"epoch": 4.4608, |
|
"grad_norm": 7.5625, |
|
"learning_rate": 1.1396011396011397e-05, |
|
"loss": 1.4653, |
|
"num_input_tokens_seen": 1745927840, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.9728, |
|
"eval_validation.parquet_accuracy": 0.8571, |
|
"eval_validation.parquet_accuracy__0": 0.8725490196078431, |
|
"eval_validation.parquet_accuracy__1": 0.7914110429447853, |
|
"eval_validation.parquet_accuracy__10": 0.9105882352941177, |
|
"eval_validation.parquet_accuracy__11": 0.8918918918918919, |
|
"eval_validation.parquet_accuracy__12": 0.9033391915641477, |
|
"eval_validation.parquet_accuracy__13": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy__14": 0.8314447592067988, |
|
"eval_validation.parquet_accuracy__15": 0.8558951965065502, |
|
"eval_validation.parquet_accuracy__16": 0.8481375358166189, |
|
"eval_validation.parquet_accuracy__17": 0.875, |
|
"eval_validation.parquet_accuracy__18": 0.8595890410958904, |
|
"eval_validation.parquet_accuracy__19": 0.8117647058823529, |
|
"eval_validation.parquet_accuracy__2": 0.8109452736318408, |
|
"eval_validation.parquet_accuracy__20": 0.7436619718309859, |
|
"eval_validation.parquet_accuracy__21": 0.9262295081967213, |
|
"eval_validation.parquet_accuracy__22": 0.8440366972477065, |
|
"eval_validation.parquet_accuracy__23": 0.863481228668942, |
|
"eval_validation.parquet_accuracy__3": 0.8809523809523809, |
|
"eval_validation.parquet_accuracy__4": 0.8497495826377296, |
|
"eval_validation.parquet_accuracy__5": 0.8731343283582089, |
|
"eval_validation.parquet_accuracy__6": 0.8883666274970623, |
|
"eval_validation.parquet_accuracy__7": 0.7956989247311828, |
|
"eval_validation.parquet_accuracy__8": 0.9044943820224719, |
|
"eval_validation.parquet_accuracy__9": 0.8420427553444181, |
|
"eval_validation.parquet_accuracy_conf50": 0.8678994687372292, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.8811881188118812, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.8025078369905956, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9148936170212766, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.8980392156862745, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.9125, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7771428571428571, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.8424855491329479, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8699551569506726, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8533724340175953, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8799313893653516, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8650519031141869, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.8277945619335347, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8298969072164949, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.7647058823529411, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.9284731774415406, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8584905660377359, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.8625429553264605, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.9040247678018576, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.8620102214650767, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8854961832061069, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.9008363201911589, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.8076923076923077, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.9065155807365439, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.8527980535279805, |
|
"eval_validation.parquet_accuracy_conf75": 0.9163840486492808, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.9347826086956522, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.87890625, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9518987341772152, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9288702928870293, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9470588235294117, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.8217054263565892, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.9061433447098977, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9447513812154696, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.910958904109589, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.924901185770751, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9101123595505618, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.8888888888888888, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.9047619047619048, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8326996197718631, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9502923976608187, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.9028776978417267, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9325396825396826, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9368421052631579, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.9009708737864077, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.9224137931034483, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9308996088657105, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.864, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.940251572327044, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.9117221418234442, |
|
"eval_validation.parquet_accuracy_label_average": 0.8506808235334006, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8620143984651407, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.9116353999015111, |
|
"eval_validation.parquet_accuracy_label_min": 0.7419354838709677, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7647058823529411, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.8217054263565892, |
|
"eval_validation.parquet_loss": 0.47900858521461487, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 8.446, |
|
"eval_validation.parquet_samples_per_second": 1183.995, |
|
"eval_validation.parquet_steps_per_second": 37.059, |
|
"num_input_tokens_seen": 1949274656, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 4.9728, |
|
"num_input_tokens_seen": 1949274656, |
|
"step": 780, |
|
"total_flos": 1.297523316772307e+18, |
|
"train_loss": 1.6634563641670423, |
|
"train_runtime": 573.9155, |
|
"train_samples_per_second": 696.967, |
|
"train_steps_per_second": 1.359 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 780, |
|
"num_input_tokens_seen": 1949274656, |
|
"num_train_epochs": 5, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 1.297523316772307e+18, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|