{ "epoch": 4.9728, "eval_validation.parquet_accuracy": 0.8558, "eval_validation.parquet_accuracy__0": 0.8627450980392157, "eval_validation.parquet_accuracy__1": 0.7607361963190185, "eval_validation.parquet_accuracy__10": 0.9035294117647059, "eval_validation.parquet_accuracy__11": 0.8764478764478765, "eval_validation.parquet_accuracy__12": 0.8980667838312829, "eval_validation.parquet_accuracy__13": 0.7473118279569892, "eval_validation.parquet_accuracy__14": 0.839943342776204, "eval_validation.parquet_accuracy__15": 0.8427947598253275, "eval_validation.parquet_accuracy__16": 0.830945558739255, "eval_validation.parquet_accuracy__17": 0.839527027027027, "eval_validation.parquet_accuracy__18": 0.8801369863013698, "eval_validation.parquet_accuracy__19": 0.8117647058823529, "eval_validation.parquet_accuracy__2": 0.7860696517412935, "eval_validation.parquet_accuracy__20": 0.7633802816901408, "eval_validation.parquet_accuracy__21": 0.9289617486338798, "eval_validation.parquet_accuracy__22": 0.8562691131498471, "eval_validation.parquet_accuracy__23": 0.8805460750853242, "eval_validation.parquet_accuracy__3": 0.8660714285714286, "eval_validation.parquet_accuracy__4": 0.8530884808013356, "eval_validation.parquet_accuracy__5": 0.8694029850746269, "eval_validation.parquet_accuracy__6": 0.900117508813161, "eval_validation.parquet_accuracy__7": 0.7741935483870968, "eval_validation.parquet_accuracy__8": 0.8904494382022472, "eval_validation.parquet_accuracy__9": 0.8669833729216152, "eval_validation.parquet_accuracy_conf50": 0.8663669799754802, "eval_validation.parquet_accuracy_conf50__0": 0.8712871287128713, "eval_validation.parquet_accuracy_conf50__1": 0.7711598746081505, "eval_validation.parquet_accuracy_conf50__10": 0.9078014184397163, "eval_validation.parquet_accuracy_conf50__11": 0.8823529411764706, "eval_validation.parquet_accuracy_conf50__12": 0.9089285714285714, "eval_validation.parquet_accuracy_conf50__13": 0.7828571428571428, "eval_validation.parquet_accuracy_conf50__14": 0.8511560693641619, "eval_validation.parquet_accuracy_conf50__15": 0.8565022421524664, "eval_validation.parquet_accuracy_conf50__16": 0.8357771260997068, "eval_validation.parquet_accuracy_conf50__17": 0.8456260720411664, "eval_validation.parquet_accuracy_conf50__18": 0.8858131487889274, "eval_validation.parquet_accuracy_conf50__19": 0.8277945619335347, "eval_validation.parquet_accuracy_conf50__2": 0.8041237113402062, "eval_validation.parquet_accuracy_conf50__20": 0.7794117647058824, "eval_validation.parquet_accuracy_conf50__21": 0.9312242090784044, "eval_validation.parquet_accuracy_conf50__22": 0.8710691823899371, "eval_validation.parquet_accuracy_conf50__23": 0.8797250859106529, "eval_validation.parquet_accuracy_conf50__3": 0.8885448916408669, "eval_validation.parquet_accuracy_conf50__4": 0.8637137989778535, "eval_validation.parquet_accuracy_conf50__5": 0.8816793893129771, "eval_validation.parquet_accuracy_conf50__6": 0.9115890083632019, "eval_validation.parquet_accuracy_conf50__7": 0.7850678733031674, "eval_validation.parquet_accuracy_conf50__8": 0.8923512747875354, "eval_validation.parquet_accuracy_conf50__9": 0.878345498783455, "eval_validation.parquet_accuracy_conf75": 0.9145129224652088, "eval_validation.parquet_accuracy_conf75__0": 0.9239130434782609, "eval_validation.parquet_accuracy_conf75__1": 0.85546875, "eval_validation.parquet_accuracy_conf75__10": 0.9493670886075949, "eval_validation.parquet_accuracy_conf75__11": 0.9121338912133892, "eval_validation.parquet_accuracy_conf75__12": 0.9450980392156862, "eval_validation.parquet_accuracy_conf75__13": 0.8294573643410853, "eval_validation.parquet_accuracy_conf75__14": 0.9129692832764505, "eval_validation.parquet_accuracy_conf75__15": 0.9392265193370166, "eval_validation.parquet_accuracy_conf75__16": 0.8972602739726028, "eval_validation.parquet_accuracy_conf75__17": 0.8893280632411067, "eval_validation.parquet_accuracy_conf75__18": 0.9288389513108615, "eval_validation.parquet_accuracy_conf75__19": 0.8925925925925926, "eval_validation.parquet_accuracy_conf75__2": 0.8809523809523809, "eval_validation.parquet_accuracy_conf75__20": 0.8479087452471483, "eval_validation.parquet_accuracy_conf75__21": 0.9502923976608187, "eval_validation.parquet_accuracy_conf75__22": 0.9064748201438849, "eval_validation.parquet_accuracy_conf75__23": 0.9404761904761905, "eval_validation.parquet_accuracy_conf75__3": 0.9228070175438596, "eval_validation.parquet_accuracy_conf75__4": 0.9067961165048544, "eval_validation.parquet_accuracy_conf75__5": 0.9224137931034483, "eval_validation.parquet_accuracy_conf75__6": 0.9374185136897001, "eval_validation.parquet_accuracy_conf75__7": 0.8453333333333334, "eval_validation.parquet_accuracy_conf75__8": 0.9276729559748428, "eval_validation.parquet_accuracy_conf75__9": 0.9305354558610709, "eval_validation.parquet_accuracy_label_average": 0.8470618003326092, "eval_validation.parquet_accuracy_label_average_conf50": 0.8580792494248763, "eval_validation.parquet_accuracy_label_average_conf75": 0.9081139825449239, "eval_validation.parquet_accuracy_label_min": 0.7473118279569892, "eval_validation.parquet_accuracy_label_min_conf50": 0.7711598746081505, "eval_validation.parquet_accuracy_label_min_conf75": 0.8294573643410853, "eval_validation.parquet_loss": 0.4807276427745819, "eval_validation.parquet_proportion_conf50": 0.9788, "eval_validation.parquet_proportion_conf75": 0.8551, "eval_validation.parquet_runtime": 8.4462, "eval_validation.parquet_samples_per_second": 1183.97, "eval_validation.parquet_steps_per_second": 37.058, "num_input_tokens_seen": 1949274656, "test_accuracy": 0.8585, "test_accuracy__0": 0.9345794392523364, "test_accuracy__1": 0.7317073170731707, "test_accuracy__10": 0.9148351648351648, "test_accuracy__11": 0.89272030651341, "test_accuracy__12": 0.8687196110210696, "test_accuracy__13": 0.813953488372093, "test_accuracy__14": 0.8615819209039548, "test_accuracy__15": 0.717948717948718, "test_accuracy__16": 0.8550295857988166, "test_accuracy__17": 0.8245931283905967, "test_accuracy__18": 0.9069767441860465, "test_accuracy__19": 0.8333333333333334, "test_accuracy__2": 0.8660287081339713, "test_accuracy__20": 0.8294117647058824, "test_accuracy__21": 0.944141689373297, "test_accuracy__22": 0.8787878787878788, "test_accuracy__23": 0.9, "test_accuracy__3": 0.8470254957507082, "test_accuracy__4": 0.8442367601246106, "test_accuracy__5": 0.8188679245283019, "test_accuracy__6": 0.8996655518394648, "test_accuracy__7": 0.729490022172949, "test_accuracy__8": 0.8937329700272479, "test_accuracy__9": 0.8665105386416861, "test_accuracy_conf50": 0.8673937417184793, "test_accuracy_conf50__0": 0.9433962264150944, "test_accuracy_conf50__1": 0.7452830188679245, "test_accuracy_conf50__10": 0.9299719887955182, "test_accuracy_conf50__11": 0.8957528957528957, "test_accuracy_conf50__12": 0.8768472906403941, "test_accuracy_conf50__13": 0.8192771084337349, "test_accuracy_conf50__14": 0.8690647482014389, "test_accuracy_conf50__15": 0.7236842105263158, "test_accuracy_conf50__16": 0.8640483383685801, "test_accuracy_conf50__17": 0.8357933579335793, "test_accuracy_conf50__18": 0.91, "test_accuracy_conf50__19": 0.8480565371024735, "test_accuracy_conf50__2": 0.8768472906403941, "test_accuracy_conf50__20": 0.8433734939759037, "test_accuracy_conf50__21": 0.9504814305364512, "test_accuracy_conf50__22": 0.8843537414965986, "test_accuracy_conf50__23": 0.9028213166144201, "test_accuracy_conf50__3": 0.8571428571428571, "test_accuracy_conf50__4": 0.8510301109350238, "test_accuracy_conf50__5": 0.8206106870229007, "test_accuracy_conf50__6": 0.9071347678369196, "test_accuracy_conf50__7": 0.7441860465116279, "test_accuracy_conf50__8": 0.9005524861878453, "test_accuracy_conf50__9": 0.8760529482551144, "test_accuracy_conf75": 0.917750439367311, "test_accuracy_conf75__0": 0.95, "test_accuracy_conf75__1": 0.8412698412698413, "test_accuracy_conf75__10": 0.9556213017751479, "test_accuracy_conf75__11": 0.9297520661157025, "test_accuracy_conf75__12": 0.9298892988929889, "test_accuracy_conf75__13": 0.8787878787878788, "test_accuracy_conf75__14": 0.9126050420168067, "test_accuracy_conf75__15": 0.8253012048192772, "test_accuracy_conf75__16": 0.8885017421602788, "test_accuracy_conf75__17": 0.8968421052631579, "test_accuracy_conf75__18": 0.9379562043795621, "test_accuracy_conf75__19": 0.9112903225806451, "test_accuracy_conf75__2": 0.9028571428571428, "test_accuracy_conf75__20": 0.896551724137931, "test_accuracy_conf75__21": 0.9680232558139535, "test_accuracy_conf75__22": 0.9224806201550387, "test_accuracy_conf75__23": 0.9444444444444444, "test_accuracy_conf75__3": 0.931899641577061, "test_accuracy_conf75__4": 0.8976234003656307, "test_accuracy_conf75__5": 0.9166666666666666, "test_accuracy_conf75__6": 0.9482976040353089, "test_accuracy_conf75__7": 0.8040345821325648, "test_accuracy_conf75__8": 0.9447852760736196, "test_accuracy_conf75__9": 0.9320113314447592, "test_accuracy_label_average": 0.853078252571446, "test_accuracy_label_average_conf50": 0.8614901207580835, "test_accuracy_label_average_conf75": 0.9111455290735587, "test_accuracy_label_min": 0.717948717948718, "test_accuracy_label_min_conf50": 0.7236842105263158, "test_accuracy_label_min_conf75": 0.8040345821325648, "test_loss": 0.4694322645664215, "test_proportion_conf50": 0.9811, "test_proportion_conf75": 0.8535, "test_runtime": 8.3953, "test_samples_per_second": 1191.144, "test_steps_per_second": 37.283, "train_loss": 1.6634563641670423, "train_runtime": 573.9155, "train_samples_per_second": 696.967, "train_steps_per_second": 1.359 }