|
{ |
|
"epoch": 4.9728, |
|
"eval_validation.parquet_accuracy": 0.8558, |
|
"eval_validation.parquet_accuracy__0": 0.8627450980392157, |
|
"eval_validation.parquet_accuracy__1": 0.7607361963190185, |
|
"eval_validation.parquet_accuracy__10": 0.9035294117647059, |
|
"eval_validation.parquet_accuracy__11": 0.8764478764478765, |
|
"eval_validation.parquet_accuracy__12": 0.8980667838312829, |
|
"eval_validation.parquet_accuracy__13": 0.7473118279569892, |
|
"eval_validation.parquet_accuracy__14": 0.839943342776204, |
|
"eval_validation.parquet_accuracy__15": 0.8427947598253275, |
|
"eval_validation.parquet_accuracy__16": 0.830945558739255, |
|
"eval_validation.parquet_accuracy__17": 0.839527027027027, |
|
"eval_validation.parquet_accuracy__18": 0.8801369863013698, |
|
"eval_validation.parquet_accuracy__19": 0.8117647058823529, |
|
"eval_validation.parquet_accuracy__2": 0.7860696517412935, |
|
"eval_validation.parquet_accuracy__20": 0.7633802816901408, |
|
"eval_validation.parquet_accuracy__21": 0.9289617486338798, |
|
"eval_validation.parquet_accuracy__22": 0.8562691131498471, |
|
"eval_validation.parquet_accuracy__23": 0.8805460750853242, |
|
"eval_validation.parquet_accuracy__3": 0.8660714285714286, |
|
"eval_validation.parquet_accuracy__4": 0.8530884808013356, |
|
"eval_validation.parquet_accuracy__5": 0.8694029850746269, |
|
"eval_validation.parquet_accuracy__6": 0.900117508813161, |
|
"eval_validation.parquet_accuracy__7": 0.7741935483870968, |
|
"eval_validation.parquet_accuracy__8": 0.8904494382022472, |
|
"eval_validation.parquet_accuracy__9": 0.8669833729216152, |
|
"eval_validation.parquet_accuracy_conf50": 0.8663669799754802, |
|
"eval_validation.parquet_accuracy_conf50__0": 0.8712871287128713, |
|
"eval_validation.parquet_accuracy_conf50__1": 0.7711598746081505, |
|
"eval_validation.parquet_accuracy_conf50__10": 0.9078014184397163, |
|
"eval_validation.parquet_accuracy_conf50__11": 0.8823529411764706, |
|
"eval_validation.parquet_accuracy_conf50__12": 0.9089285714285714, |
|
"eval_validation.parquet_accuracy_conf50__13": 0.7828571428571428, |
|
"eval_validation.parquet_accuracy_conf50__14": 0.8511560693641619, |
|
"eval_validation.parquet_accuracy_conf50__15": 0.8565022421524664, |
|
"eval_validation.parquet_accuracy_conf50__16": 0.8357771260997068, |
|
"eval_validation.parquet_accuracy_conf50__17": 0.8456260720411664, |
|
"eval_validation.parquet_accuracy_conf50__18": 0.8858131487889274, |
|
"eval_validation.parquet_accuracy_conf50__19": 0.8277945619335347, |
|
"eval_validation.parquet_accuracy_conf50__2": 0.8041237113402062, |
|
"eval_validation.parquet_accuracy_conf50__20": 0.7794117647058824, |
|
"eval_validation.parquet_accuracy_conf50__21": 0.9312242090784044, |
|
"eval_validation.parquet_accuracy_conf50__22": 0.8710691823899371, |
|
"eval_validation.parquet_accuracy_conf50__23": 0.8797250859106529, |
|
"eval_validation.parquet_accuracy_conf50__3": 0.8885448916408669, |
|
"eval_validation.parquet_accuracy_conf50__4": 0.8637137989778535, |
|
"eval_validation.parquet_accuracy_conf50__5": 0.8816793893129771, |
|
"eval_validation.parquet_accuracy_conf50__6": 0.9115890083632019, |
|
"eval_validation.parquet_accuracy_conf50__7": 0.7850678733031674, |
|
"eval_validation.parquet_accuracy_conf50__8": 0.8923512747875354, |
|
"eval_validation.parquet_accuracy_conf50__9": 0.878345498783455, |
|
"eval_validation.parquet_accuracy_conf75": 0.9145129224652088, |
|
"eval_validation.parquet_accuracy_conf75__0": 0.9239130434782609, |
|
"eval_validation.parquet_accuracy_conf75__1": 0.85546875, |
|
"eval_validation.parquet_accuracy_conf75__10": 0.9493670886075949, |
|
"eval_validation.parquet_accuracy_conf75__11": 0.9121338912133892, |
|
"eval_validation.parquet_accuracy_conf75__12": 0.9450980392156862, |
|
"eval_validation.parquet_accuracy_conf75__13": 0.8294573643410853, |
|
"eval_validation.parquet_accuracy_conf75__14": 0.9129692832764505, |
|
"eval_validation.parquet_accuracy_conf75__15": 0.9392265193370166, |
|
"eval_validation.parquet_accuracy_conf75__16": 0.8972602739726028, |
|
"eval_validation.parquet_accuracy_conf75__17": 0.8893280632411067, |
|
"eval_validation.parquet_accuracy_conf75__18": 0.9288389513108615, |
|
"eval_validation.parquet_accuracy_conf75__19": 0.8925925925925926, |
|
"eval_validation.parquet_accuracy_conf75__2": 0.8809523809523809, |
|
"eval_validation.parquet_accuracy_conf75__20": 0.8479087452471483, |
|
"eval_validation.parquet_accuracy_conf75__21": 0.9502923976608187, |
|
"eval_validation.parquet_accuracy_conf75__22": 0.9064748201438849, |
|
"eval_validation.parquet_accuracy_conf75__23": 0.9404761904761905, |
|
"eval_validation.parquet_accuracy_conf75__3": 0.9228070175438596, |
|
"eval_validation.parquet_accuracy_conf75__4": 0.9067961165048544, |
|
"eval_validation.parquet_accuracy_conf75__5": 0.9224137931034483, |
|
"eval_validation.parquet_accuracy_conf75__6": 0.9374185136897001, |
|
"eval_validation.parquet_accuracy_conf75__7": 0.8453333333333334, |
|
"eval_validation.parquet_accuracy_conf75__8": 0.9276729559748428, |
|
"eval_validation.parquet_accuracy_conf75__9": 0.9305354558610709, |
|
"eval_validation.parquet_accuracy_label_average": 0.8470618003326092, |
|
"eval_validation.parquet_accuracy_label_average_conf50": 0.8580792494248763, |
|
"eval_validation.parquet_accuracy_label_average_conf75": 0.9081139825449239, |
|
"eval_validation.parquet_accuracy_label_min": 0.7473118279569892, |
|
"eval_validation.parquet_accuracy_label_min_conf50": 0.7711598746081505, |
|
"eval_validation.parquet_accuracy_label_min_conf75": 0.8294573643410853, |
|
"eval_validation.parquet_loss": 0.4807276427745819, |
|
"eval_validation.parquet_proportion_conf50": 0.9788, |
|
"eval_validation.parquet_proportion_conf75": 0.8551, |
|
"eval_validation.parquet_runtime": 8.4462, |
|
"eval_validation.parquet_samples_per_second": 1183.97, |
|
"eval_validation.parquet_steps_per_second": 37.058, |
|
"num_input_tokens_seen": 1949274656, |
|
"test_accuracy": 0.8585, |
|
"test_accuracy__0": 0.9345794392523364, |
|
"test_accuracy__1": 0.7317073170731707, |
|
"test_accuracy__10": 0.9148351648351648, |
|
"test_accuracy__11": 0.89272030651341, |
|
"test_accuracy__12": 0.8687196110210696, |
|
"test_accuracy__13": 0.813953488372093, |
|
"test_accuracy__14": 0.8615819209039548, |
|
"test_accuracy__15": 0.717948717948718, |
|
"test_accuracy__16": 0.8550295857988166, |
|
"test_accuracy__17": 0.8245931283905967, |
|
"test_accuracy__18": 0.9069767441860465, |
|
"test_accuracy__19": 0.8333333333333334, |
|
"test_accuracy__2": 0.8660287081339713, |
|
"test_accuracy__20": 0.8294117647058824, |
|
"test_accuracy__21": 0.944141689373297, |
|
"test_accuracy__22": 0.8787878787878788, |
|
"test_accuracy__23": 0.9, |
|
"test_accuracy__3": 0.8470254957507082, |
|
"test_accuracy__4": 0.8442367601246106, |
|
"test_accuracy__5": 0.8188679245283019, |
|
"test_accuracy__6": 0.8996655518394648, |
|
"test_accuracy__7": 0.729490022172949, |
|
"test_accuracy__8": 0.8937329700272479, |
|
"test_accuracy__9": 0.8665105386416861, |
|
"test_accuracy_conf50": 0.8673937417184793, |
|
"test_accuracy_conf50__0": 0.9433962264150944, |
|
"test_accuracy_conf50__1": 0.7452830188679245, |
|
"test_accuracy_conf50__10": 0.9299719887955182, |
|
"test_accuracy_conf50__11": 0.8957528957528957, |
|
"test_accuracy_conf50__12": 0.8768472906403941, |
|
"test_accuracy_conf50__13": 0.8192771084337349, |
|
"test_accuracy_conf50__14": 0.8690647482014389, |
|
"test_accuracy_conf50__15": 0.7236842105263158, |
|
"test_accuracy_conf50__16": 0.8640483383685801, |
|
"test_accuracy_conf50__17": 0.8357933579335793, |
|
"test_accuracy_conf50__18": 0.91, |
|
"test_accuracy_conf50__19": 0.8480565371024735, |
|
"test_accuracy_conf50__2": 0.8768472906403941, |
|
"test_accuracy_conf50__20": 0.8433734939759037, |
|
"test_accuracy_conf50__21": 0.9504814305364512, |
|
"test_accuracy_conf50__22": 0.8843537414965986, |
|
"test_accuracy_conf50__23": 0.9028213166144201, |
|
"test_accuracy_conf50__3": 0.8571428571428571, |
|
"test_accuracy_conf50__4": 0.8510301109350238, |
|
"test_accuracy_conf50__5": 0.8206106870229007, |
|
"test_accuracy_conf50__6": 0.9071347678369196, |
|
"test_accuracy_conf50__7": 0.7441860465116279, |
|
"test_accuracy_conf50__8": 0.9005524861878453, |
|
"test_accuracy_conf50__9": 0.8760529482551144, |
|
"test_accuracy_conf75": 0.917750439367311, |
|
"test_accuracy_conf75__0": 0.95, |
|
"test_accuracy_conf75__1": 0.8412698412698413, |
|
"test_accuracy_conf75__10": 0.9556213017751479, |
|
"test_accuracy_conf75__11": 0.9297520661157025, |
|
"test_accuracy_conf75__12": 0.9298892988929889, |
|
"test_accuracy_conf75__13": 0.8787878787878788, |
|
"test_accuracy_conf75__14": 0.9126050420168067, |
|
"test_accuracy_conf75__15": 0.8253012048192772, |
|
"test_accuracy_conf75__16": 0.8885017421602788, |
|
"test_accuracy_conf75__17": 0.8968421052631579, |
|
"test_accuracy_conf75__18": 0.9379562043795621, |
|
"test_accuracy_conf75__19": 0.9112903225806451, |
|
"test_accuracy_conf75__2": 0.9028571428571428, |
|
"test_accuracy_conf75__20": 0.896551724137931, |
|
"test_accuracy_conf75__21": 0.9680232558139535, |
|
"test_accuracy_conf75__22": 0.9224806201550387, |
|
"test_accuracy_conf75__23": 0.9444444444444444, |
|
"test_accuracy_conf75__3": 0.931899641577061, |
|
"test_accuracy_conf75__4": 0.8976234003656307, |
|
"test_accuracy_conf75__5": 0.9166666666666666, |
|
"test_accuracy_conf75__6": 0.9482976040353089, |
|
"test_accuracy_conf75__7": 0.8040345821325648, |
|
"test_accuracy_conf75__8": 0.9447852760736196, |
|
"test_accuracy_conf75__9": 0.9320113314447592, |
|
"test_accuracy_label_average": 0.853078252571446, |
|
"test_accuracy_label_average_conf50": 0.8614901207580835, |
|
"test_accuracy_label_average_conf75": 0.9111455290735587, |
|
"test_accuracy_label_min": 0.717948717948718, |
|
"test_accuracy_label_min_conf50": 0.7236842105263158, |
|
"test_accuracy_label_min_conf75": 0.8040345821325648, |
|
"test_loss": 0.4694322645664215, |
|
"test_proportion_conf50": 0.9811, |
|
"test_proportion_conf75": 0.8535, |
|
"test_runtime": 8.3953, |
|
"test_samples_per_second": 1191.144, |
|
"test_steps_per_second": 37.283, |
|
"train_loss": 1.6634563641670423, |
|
"train_runtime": 573.9155, |
|
"train_samples_per_second": 696.967, |
|
"train_steps_per_second": 1.359 |
|
} |