{ "best_metric": null, "best_model_checkpoint": null, "epoch": 49.0, "eval_steps": 500, "global_step": 3969, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_B": { "f1-score": 0.8266764382557715, "precision": 0.7866108786610879, "recall": 0.871042471042471, "support": 1295.0 }, "eval_I": { "f1-score": 0.9410658617447671, "precision": 0.9344077040239768, "recall": 0.9478195863443808, "support": 20065.0 }, "eval_O": { "f1-score": 0.8562443302086484, "precision": 0.8789421405512788, "recall": 0.8346893055064262, "support": 8481.0 }, "eval_accuracy": 0.912335377500754, "eval_loss": 0.2450982630252838, "eval_macro avg": { "f1-score": 0.8746622100697291, "precision": 0.8666535744121145, "recall": 0.8845171209644261, "support": 29841.0 }, "eval_runtime": 4.6269, "eval_samples_per_second": 17.29, "eval_steps_per_second": 2.161, "eval_weighted avg": { "f1-score": 0.9119949287205363, "precision": 0.9122301519092053, "recall": 0.912335377500754, "support": 29841.0 }, "step": 81 }, { "epoch": 2.0, "eval_B": { "f1-score": 0.8833395452851286, "precision": 0.8537463976945245, "recall": 0.915057915057915, "support": 1295.0 }, "eval_I": { "f1-score": 0.9549518227873249, "precision": 0.9516903430183636, "recall": 0.958235733864939, "support": 20065.0 }, "eval_O": { "f1-score": 0.88924750463212, "precision": 0.9016969696969697, "recall": 0.877137130055418, "support": 8481.0 }, "eval_accuracy": 0.9333132267685399, "eval_loss": 0.20076116919517517, "eval_macro avg": { "f1-score": 0.9091796242348579, "precision": 0.9023779034699526, "recall": 0.916810259659424, "support": 29841.0 }, "eval_runtime": 4.6524, "eval_samples_per_second": 17.195, "eval_steps_per_second": 2.149, "eval_weighted avg": { "f1-score": 0.9331705077630417, "precision": 0.9332314707173981, "recall": 0.9333132267685399, "support": 29841.0 }, "step": 162 }, { "epoch": 3.0, "eval_B": { "f1-score": 0.8927335640138409, "precision": 0.8889739663093414, "recall": 0.8965250965250965, "support": 1295.0 }, "eval_I": { "f1-score": 0.9590235396687009, "precision": 0.9586653386454184, "recall": 0.9593820084724645, "support": 20065.0 }, "eval_O": { "f1-score": 0.9006849315068494, "precision": 0.9020697811945594, "recall": 0.8993043273198915, "support": 8481.0 }, "eval_accuracy": 0.9395797727958178, "eval_loss": 0.19863653182983398, "eval_macro avg": { "f1-score": 0.9174806783964637, "precision": 0.9165696953831063, "recall": 0.9184038107724842, "support": 29841.0 }, "eval_runtime": 4.655, "eval_samples_per_second": 17.186, "eval_steps_per_second": 2.148, "eval_weighted avg": { "f1-score": 0.9395665759512081, "precision": 0.9395561516236713, "recall": 0.9395797727958178, "support": 29841.0 }, "step": 243 }, { "epoch": 4.0, "eval_B": { "f1-score": 0.8999616711383672, "precision": 0.893455098934551, "recall": 0.9065637065637066, "support": 1295.0 }, "eval_I": { "f1-score": 0.9612657113512985, "precision": 0.9436362763454799, "recall": 0.9795664091701969, "support": 20065.0 }, "eval_O": { "f1-score": 0.8996847765622102, "precision": 0.9454403741231489, "recall": 0.8581535196321188, "support": 8481.0 }, "eval_accuracy": 0.9418920277470594, "eval_loss": 0.19743724167346954, "eval_macro avg": { "f1-score": 0.920304053017292, "precision": 0.9275105831343932, "recall": 0.9147612117886741, "support": 29841.0 }, "eval_runtime": 4.6615, "eval_samples_per_second": 17.162, "eval_steps_per_second": 2.145, "eval_weighted avg": { "f1-score": 0.9411036309913238, "precision": 0.9419713163409645, "recall": 0.9418920277470594, "support": 29841.0 }, "step": 324 }, { "epoch": 5.0, "eval_B": { "f1-score": 0.8953846153846153, "precision": 0.8919540229885058, "recall": 0.8988416988416988, "support": 1295.0 }, "eval_I": { "f1-score": 0.9602426713742261, "precision": 0.9581224570804803, "recall": 0.9623722900573137, "support": 20065.0 }, "eval_O": { "f1-score": 0.9022119433078337, "precision": 0.9075399665950847, "recall": 0.8969461148449476, "support": 8481.0 }, "eval_accuracy": 0.9410207432726785, "eval_loss": 0.2340461015701294, "eval_macro avg": { "f1-score": 0.9192797433555584, "precision": 0.9192054822213569, "recall": 0.9193867012479867, "support": 29841.0 }, "eval_runtime": 4.6719, "eval_samples_per_second": 17.124, "eval_steps_per_second": 2.14, "eval_weighted avg": { "f1-score": 0.9409353496612266, "precision": 0.9408751053176122, "recall": 0.9410207432726785, "support": 29841.0 }, "step": 405 }, { "epoch": 6.0, "eval_B": { "f1-score": 0.8929831438651511, "precision": 0.9068471337579618, "recall": 0.8795366795366796, "support": 1295.0 }, "eval_I": { "f1-score": 0.9522293798155866, "precision": 0.9655225409836066, "recall": 0.9392972838275604, "support": 20065.0 }, "eval_O": { "f1-score": 0.8885216003647556, "precision": 0.8599007170435742, "recall": 0.919113312109421, "support": 8481.0 }, "eval_accuracy": 0.930967460875976, "eval_loss": 0.21774999797344208, "eval_macro avg": { "f1-score": 0.9112447080151643, "precision": 0.9107567972617142, "recall": 0.9126490918245537, "support": 29841.0 }, "eval_runtime": 4.647, "eval_samples_per_second": 17.215, "eval_steps_per_second": 2.152, "eval_weighted avg": { "f1-score": 0.9315521386682287, "precision": 0.9329578366776978, "recall": 0.930967460875976, "support": 29841.0 }, "step": 486 }, { "epoch": 6.17, "grad_norm": 9.310327529907227, "learning_rate": 1.7530864197530865e-05, "loss": 0.1627, "step": 500 }, { "epoch": 7.0, "eval_B": { "f1-score": 0.8936490041337843, "precision": 0.8704245973645681, "recall": 0.9181467181467181, "support": 1295.0 }, "eval_I": { "f1-score": 0.9599271850630982, "precision": 0.9477800446905664, "recall": 0.9723897333665587, "support": 20065.0 }, "eval_O": { "f1-score": 0.8979841172877214, "precision": 0.9316770186335404, "recall": 0.8666430845419172, "support": 8481.0 }, "eval_accuracy": 0.9399819040916859, "eval_loss": 0.27376389503479004, "eval_macro avg": { "f1-score": 0.9171867688282013, "precision": 0.9166272202295582, "recall": 0.9190598453517312, "support": 29841.0 }, "eval_runtime": 4.6671, "eval_samples_per_second": 17.141, "eval_steps_per_second": 2.143, "eval_weighted avg": { "f1-score": 0.9394463230910989, "precision": 0.9398464945991887, "recall": 0.9399819040916859, "support": 29841.0 }, "step": 567 }, { "epoch": 8.0, "eval_B": { "f1-score": 0.8948545861297539, "precision": 0.8651766402307137, "recall": 0.9266409266409267, "support": 1295.0 }, "eval_I": { "f1-score": 0.9590139880661254, "precision": 0.9414702069429106, "recall": 0.9772240219287316, "support": 20065.0 }, "eval_O": { "f1-score": 0.8927241122423641, "precision": 0.9427035531663825, "recall": 0.8477773847423653, "support": 8481.0 }, "eval_accuracy": 0.9382393351429241, "eval_loss": 0.3103167414665222, "eval_macro avg": { "f1-score": 0.9155308954794145, "precision": 0.916450133446669, "recall": 0.9172141111040079, "support": 29841.0 }, "eval_runtime": 4.6339, "eval_samples_per_second": 17.264, "eval_steps_per_second": 2.158, "eval_weighted avg": { "f1-score": 0.9373896838414373, "precision": 0.9385098450391195, "recall": 0.9382393351429241, "support": 29841.0 }, "step": 648 }, { "epoch": 9.0, "eval_B": { "f1-score": 0.9011235955056179, "precision": 0.8749090909090909, "recall": 0.9289575289575289, "support": 1295.0 }, "eval_I": { "f1-score": 0.9615119937082186, "precision": 0.9485040973670175, "recall": 0.9748816346872664, "support": 20065.0 }, "eval_O": { "f1-score": 0.9013722126929674, "precision": 0.9380339155935229, "recall": 0.8674684589081476, "support": 8481.0 }, "eval_accuracy": 0.9423611809255722, "eval_loss": 0.32883673906326294, "eval_macro avg": { "f1-score": 0.9213359339689347, "precision": 0.9204823679565438, "recall": 0.9237692075176476, "support": 29841.0 }, "eval_runtime": 4.6714, "eval_samples_per_second": 17.126, "eval_steps_per_second": 2.141, "eval_weighted avg": { "f1-score": 0.9417992341337168, "precision": 0.9423346276781992, "recall": 0.9423611809255722, "support": 29841.0 }, "step": 729 }, { "epoch": 10.0, "eval_B": { "f1-score": 0.8935361216730039, "precision": 0.8801498127340824, "recall": 0.9073359073359073, "support": 1295.0 }, "eval_I": { "f1-score": 0.9632332861646931, "precision": 0.9596359319351009, "recall": 0.9668577124345876, "support": 20065.0 }, "eval_O": { "f1-score": 0.9095462405342556, "precision": 0.9200241254523522, "recall": 0.8993043273198915, "support": 8481.0 }, "eval_accuracy": 0.9450755671726819, "eval_loss": 0.3041447699069977, "eval_macro avg": { "f1-score": 0.9221052161239841, "precision": 0.9199366233738452, "recall": 0.9244993156967954, "support": 29841.0 }, "eval_runtime": 4.6532, "eval_samples_per_second": 17.193, "eval_steps_per_second": 2.149, "eval_weighted avg": { "f1-score": 0.9449504651463465, "precision": 0.9449285744355027, "recall": 0.9450755671726819, "support": 29841.0 }, "step": 810 }, { "epoch": 11.0, "eval_B": { "f1-score": 0.8924122310305775, "precision": 0.8729689807976366, "recall": 0.9127413127413128, "support": 1295.0 }, "eval_I": { "f1-score": 0.9588723786993913, "precision": 0.9483330083837005, "recall": 0.9696486419137802, "support": 20065.0 }, "eval_O": { "f1-score": 0.8956965718453683, "precision": 0.9243507715468574, "recall": 0.8687654757693668, "support": 8481.0 }, "eval_accuracy": 0.9385074226735028, "eval_loss": 0.3531416654586792, "eval_macro avg": { "f1-score": 0.9156603938584458, "precision": 0.9152175869093981, "recall": 0.9170518101414866, "support": 29841.0 }, "eval_runtime": 4.6508, "eval_samples_per_second": 17.201, "eval_steps_per_second": 2.15, "eval_weighted avg": { "f1-score": 0.938033267772811, "precision": 0.9382465579853486, "recall": 0.9385074226735028, "support": 29841.0 }, "step": 891 }, { "epoch": 12.0, "eval_B": { "f1-score": 0.8970199924556771, "precision": 0.8768436578171092, "recall": 0.9181467181467181, "support": 1295.0 }, "eval_I": { "f1-score": 0.9595004897159647, "precision": 0.9431046931407943, "recall": 0.9764764515325193, "support": 20065.0 }, "eval_O": { "f1-score": 0.8953122104873078, "precision": 0.9400778210116731, "recall": 0.8546162009197029, "support": 8481.0 }, "eval_accuracy": 0.9393116852652391, "eval_loss": 0.4237186312675476, "eval_macro avg": { "f1-score": 0.9172775642196499, "precision": 0.9200087239898588, "recall": 0.9164131235329801, "support": 29841.0 }, "eval_runtime": 4.6388, "eval_samples_per_second": 17.246, "eval_steps_per_second": 2.156, "eval_weighted avg": { "f1-score": 0.9385463313402296, "precision": 0.9393689288141548, "recall": 0.9393116852652391, "support": 29841.0 }, "step": 972 }, { "epoch": 12.35, "grad_norm": 0.5223535895347595, "learning_rate": 1.506172839506173e-05, "loss": 0.0196, "step": 1000 }, { "epoch": 13.0, "eval_B": { "f1-score": 0.8891411275066211, "precision": 0.8716617210682492, "recall": 0.9073359073359073, "support": 1295.0 }, "eval_I": { "f1-score": 0.9610692322951795, "precision": 0.9563736860287223, "recall": 0.9658111138798904, "support": 20065.0 }, "eval_O": { "f1-score": 0.9043145233678416, "precision": 0.918104495747266, "recall": 0.8909326730338404, "support": 8481.0 }, "eval_accuracy": 0.9419925605710264, "eval_loss": 0.4308999180793762, "eval_macro avg": { "f1-score": 0.9181749610565474, "precision": 0.9153799676147458, "recall": 0.9213598980832126, "support": 29841.0 }, "eval_runtime": 4.6555, "eval_samples_per_second": 17.184, "eval_steps_per_second": 2.148, "eval_weighted avg": { "f1-score": 0.9418177466843106, "precision": 0.9418211242043584, "recall": 0.9419925605710264, "support": 29841.0 }, "step": 1053 }, { "epoch": 14.0, "eval_B": { "f1-score": 0.9025601834161253, "precision": 0.8933434190620272, "recall": 0.911969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.960806215404473, "precision": 0.9570764513895758, "recall": 0.9645651632195366, "support": 20065.0 }, "eval_O": { "f1-score": 0.9030873763261413, "precision": 0.9131011208870676, "recall": 0.8932908855087843, "support": 8481.0 }, "eval_accuracy": 0.9420260715123487, "eval_loss": 0.4198700487613678, "eval_macro avg": { "f1-score": 0.9221512583822467, "precision": 0.9211736637795568, "recall": 0.9232750535658111, "support": 29841.0 }, "eval_runtime": 4.6834, "eval_samples_per_second": 17.082, "eval_steps_per_second": 2.135, "eval_weighted avg": { "f1-score": 0.9418744743217934, "precision": 0.9418125843993292, "recall": 0.9420260715123487, "support": 29841.0 }, "step": 1134 }, { "epoch": 15.0, "eval_B": { "f1-score": 0.8935681470137825, "precision": 0.8861047835990888, "recall": 0.9011583011583012, "support": 1295.0 }, "eval_I": { "f1-score": 0.9633398694432723, "precision": 0.9595530063291139, "recall": 0.9671567405930726, "support": 20065.0 }, "eval_O": { "f1-score": 0.9100768726535964, "precision": 0.92, "recall": 0.9003655229336163, "support": 8481.0 }, "eval_accuracy": 0.9453101437619382, "eval_loss": 0.39179423451423645, "eval_macro avg": { "f1-score": 0.9223282963702171, "precision": 0.9218859299760677, "recall": 0.9228935215616634, "support": 29841.0 }, "eval_runtime": 4.6645, "eval_samples_per_second": 17.151, "eval_steps_per_second": 2.144, "eval_weighted avg": { "f1-score": 0.945174330208011, "precision": 0.9451243847979119, "recall": 0.9453101437619382, "support": 29841.0 }, "step": 1215 }, { "epoch": 16.0, "eval_B": { "f1-score": 0.9022614028363357, "precision": 0.895738203957382, "recall": 0.9088803088803089, "support": 1295.0 }, "eval_I": { "f1-score": 0.9632045864531594, "precision": 0.9552494853445741, "recall": 0.9712932967854473, "support": 20065.0 }, "eval_O": { "f1-score": 0.9083463808262073, "precision": 0.9282461538461538, "recall": 0.8892819243013795, "support": 8481.0 }, "eval_accuracy": 0.9452766328206159, "eval_loss": 0.44052162766456604, "eval_macro avg": { "f1-score": 0.9246041233719008, "precision": 0.92641128104937, "recall": 0.9231518433223785, "support": 29841.0 }, "eval_runtime": 4.6376, "eval_samples_per_second": 17.25, "eval_steps_per_second": 2.156, "eval_weighted avg": { "f1-score": 0.9449688080038458, "precision": 0.944992377210312, "recall": 0.9452766328206159, "support": 29841.0 }, "step": 1296 }, { "epoch": 17.0, "eval_B": { "f1-score": 0.8923649906890131, "precision": 0.8618705035971223, "recall": 0.9250965250965251, "support": 1295.0 }, "eval_I": { "f1-score": 0.9599605522682445, "precision": 0.9498902171261283, "recall": 0.97024669823075, "support": 20065.0 }, "eval_O": { "f1-score": 0.9001642635517431, "precision": 0.9298642533936652, "recall": 0.8723027944817828, "support": 8481.0 }, "eval_accuracy": 0.9404510572701987, "eval_loss": 0.4657233655452728, "eval_macro avg": { "f1-score": 0.9174966021696669, "precision": 0.9138749913723053, "recall": 0.9225486726030193, "support": 29841.0 }, "eval_runtime": 4.6396, "eval_samples_per_second": 17.243, "eval_steps_per_second": 2.155, "eval_weighted avg": { "f1-score": 0.940032648483192, "precision": 0.9403789498282803, "recall": 0.9404510572701987, "support": 29841.0 }, "step": 1377 }, { "epoch": 18.0, "eval_B": { "f1-score": 0.9014302280633939, "precision": 0.9024767801857585, "recall": 0.9003861003861003, "support": 1295.0 }, "eval_I": { "f1-score": 0.9638021281301453, "precision": 0.9506496024820632, "recall": 0.9773236979815599, "support": 20065.0 }, "eval_O": { "f1-score": 0.9083038653822705, "precision": 0.9404115641964399, "recall": 0.87831623629289, "support": 8481.0 }, "eval_accuracy": 0.9458463188230958, "eval_loss": 0.4731404185295105, "eval_macro avg": { "f1-score": 0.9245120738586032, "precision": 0.9311793156214204, "recall": 0.9186753448868501, "support": 29841.0 }, "eval_runtime": 4.6405, "eval_samples_per_second": 17.24, "eval_steps_per_second": 2.155, "eval_weighted avg": { "f1-score": 0.9453224398840687, "precision": 0.9456493475450943, "recall": 0.9458463188230958, "support": 29841.0 }, "step": 1458 }, { "epoch": 18.52, "grad_norm": 1.548362135887146, "learning_rate": 1.2592592592592593e-05, "loss": 0.0038, "step": 1500 }, { "epoch": 19.0, "eval_B": { "f1-score": 0.8891402714932127, "precision": 0.868828297715549, "recall": 0.9104247104247104, "support": 1295.0 }, "eval_I": { "f1-score": 0.9603099696984749, "precision": 0.9571718572065158, "recall": 0.9634687266384251, "support": 20065.0 }, "eval_O": { "f1-score": 0.9027910305343512, "precision": 0.913358271992277, "recall": 0.8924655111425539, "support": 8481.0 }, "eval_accuracy": 0.9409872323313562, "eval_loss": 0.49517783522605896, "eval_macro avg": { "f1-score": 0.9174137572420129, "precision": 0.9131194756381139, "recall": 0.9221196494018965, "support": 29841.0 }, "eval_runtime": 4.6377, "eval_samples_per_second": 17.25, "eval_steps_per_second": 2.156, "eval_weighted avg": { "f1-score": 0.9408741973642117, "precision": 0.9408859443435835, "recall": 0.9409872323313562, "support": 29841.0 }, "step": 1539 }, { "epoch": 20.0, "eval_B": { "f1-score": 0.899884925201381, "precision": 0.8940548780487805, "recall": 0.9057915057915058, "support": 1295.0 }, "eval_I": { "f1-score": 0.9634953846153845, "precision": 0.951896887159533, "recall": 0.9753800149514079, "support": 20065.0 }, "eval_O": { "f1-score": 0.9073556231003039, "precision": 0.9365039528171665, "recall": 0.8799669850253508, "support": 8481.0 }, "eval_accuracy": 0.9452431218792936, "eval_loss": 0.45907479524612427, "eval_macro avg": { "f1-score": 0.9235786443056897, "precision": 0.9274852393418267, "recall": 0.9203795019227549, "support": 29841.0 }, "eval_runtime": 4.6356, "eval_samples_per_second": 17.258, "eval_steps_per_second": 2.157, "eval_weighted avg": { "f1-score": 0.9447796290324438, "precision": 0.9450119678218422, "recall": 0.9452431218792936, "support": 29841.0 }, "step": 1620 }, { "epoch": 21.0, "eval_B": { "f1-score": 0.8944337811900192, "precision": 0.8893129770992366, "recall": 0.8996138996138996, "support": 1295.0 }, "eval_I": { "f1-score": 0.9624703322784811, "precision": 0.9549624687239366, "recall": 0.9700971841515076, "support": 20065.0 }, "eval_O": { "f1-score": 0.9066089361958025, "precision": 0.9251350024545901, "recall": 0.8888102818063908, "support": 8481.0 }, "eval_accuracy": 0.9439361951677223, "eval_loss": 0.4614206850528717, "eval_macro avg": { "f1-score": 0.9211710165547675, "precision": 0.9231368160925877, "recall": 0.9195071218572659, "support": 29841.0 }, "eval_runtime": 4.6636, "eval_samples_per_second": 17.154, "eval_steps_per_second": 2.144, "eval_weighted avg": { "f1-score": 0.9436416122678664, "precision": 0.9436363458364894, "recall": 0.9439361951677223, "support": 29841.0 }, "step": 1701 }, { "epoch": 22.0, "eval_B": { "f1-score": 0.9011072928598702, "precision": 0.8912386706948641, "recall": 0.9111969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.9635141147970535, "precision": 0.9558585511795576, "recall": 0.9712932967854473, "support": 20065.0 }, "eval_O": { "f1-score": 0.9095068938527304, "precision": 0.9292568897637795, "recall": 0.8905789411625987, "support": 8481.0 }, "eval_accuracy": 0.9457457859991287, "eval_loss": 0.4724768102169037, "eval_macro avg": { "f1-score": 0.9247094338365515, "precision": 0.9254513705460671, "recall": 0.9243563830483191, "support": 29841.0 }, "eval_runtime": 4.6333, "eval_samples_per_second": 17.266, "eval_steps_per_second": 2.158, "eval_weighted avg": { "f1-score": 0.9454566745223489, "precision": 0.9454939040264833, "recall": 0.9457457859991287, "support": 29841.0 }, "step": 1782 }, { "epoch": 23.0, "eval_B": { "f1-score": 0.8956916099773242, "precision": 0.8771280532938565, "recall": 0.915057915057915, "support": 1295.0 }, "eval_I": { "f1-score": 0.9624542808091362, "precision": 0.9609957269204015, "recall": 0.9639172688761525, "support": 20065.0 }, "eval_O": { "f1-score": 0.9084001187295934, "precision": 0.914753706360593, "recall": 0.9021341822898243, "support": 8481.0 }, "eval_accuracy": 0.9442377936396233, "eval_loss": 0.47468113899230957, "eval_macro avg": { "f1-score": 0.9221820031720179, "precision": 0.9176258288582838, "recall": 0.927036455407964, "support": 29841.0 }, "eval_runtime": 4.6476, "eval_samples_per_second": 17.213, "eval_steps_per_second": 2.152, "eval_weighted avg": { "f1-score": 0.9441944702356367, "precision": 0.9442138759866489, "recall": 0.9442377936396233, "support": 29841.0 }, "step": 1863 }, { "epoch": 24.0, "eval_B": { "f1-score": 0.9008390541571321, "precision": 0.8899773926149209, "recall": 0.911969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.9639726399486381, "precision": 0.9553151918559123, "recall": 0.9727884375778719, "support": 20065.0 }, "eval_O": { "f1-score": 0.9101008271448409, "precision": 0.9325661964860184, "recall": 0.8886923711826435, "support": 8481.0 }, "eval_accuracy": 0.9462484501189639, "eval_loss": 0.4712923467159271, "eval_macro avg": { "f1-score": 0.9249708404168704, "precision": 0.9259529269856172, "recall": 0.9244833069098758, "support": 29841.0 }, "eval_runtime": 4.6509, "eval_samples_per_second": 17.201, "eval_steps_per_second": 2.15, "eval_weighted avg": { "f1-score": 0.9459221443892064, "precision": 0.9460143413566277, "recall": 0.9462484501189639, "support": 29841.0 }, "step": 1944 }, { "epoch": 24.69, "grad_norm": 0.04072243347764015, "learning_rate": 1.0123456790123458e-05, "loss": 0.0014, "step": 2000 }, { "epoch": 25.0, "eval_B": { "f1-score": 0.8943768996960487, "precision": 0.8803290949887809, "recall": 0.9088803088803089, "support": 1295.0 }, "eval_I": { "f1-score": 0.9629187495336865, "precision": 0.9610305798252582, "recall": 0.9648143533516073, "support": 20065.0 }, "eval_O": { "f1-score": 0.9089721512974288, "precision": 0.9155502392344498, "recall": 0.9024879141610659, "support": 8481.0 }, "eval_accuracy": 0.9446734358768137, "eval_loss": 0.48565673828125, "eval_macro avg": { "f1-score": 0.922089266842388, "precision": 0.9189699713494962, "recall": 0.925394192130994, "support": 29841.0 }, "eval_runtime": 4.6314, "eval_samples_per_second": 17.274, "eval_steps_per_second": 2.159, "eval_weighted avg": { "f1-score": 0.9446122988389564, "precision": 0.944602605179171, "recall": 0.9446734358768137, "support": 29841.0 }, "step": 2025 }, { "epoch": 26.0, "eval_B": { "f1-score": 0.897679726131609, "precision": 0.8845577211394303, "recall": 0.9111969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.962990450744644, "precision": 0.9560839023431743, "recall": 0.9699975080986792, "support": 20065.0 }, "eval_O": { "f1-score": 0.9077024833142927, "precision": 0.9261349693251534, "recall": 0.8899893880438627, "support": 8481.0 }, "eval_accuracy": 0.9447069468181362, "eval_loss": 0.4857862889766693, "eval_macro avg": { "f1-score": 0.9227908867301818, "precision": 0.9222588642692527, "recall": 0.9237279357798177, "support": 29841.0 }, "eval_runtime": 4.7085, "eval_samples_per_second": 16.991, "eval_steps_per_second": 2.124, "eval_weighted avg": { "f1-score": 0.94444299455515, "precision": 0.9444682290887698, "recall": 0.9447069468181362, "support": 29841.0 }, "step": 2106 }, { "epoch": 27.0, "eval_B": { "f1-score": 0.8986280487804879, "precision": 0.8871331828442438, "recall": 0.9104247104247104, "support": 1295.0 }, "eval_I": { "f1-score": 0.9620497586334943, "precision": 0.9557796360059027, "recall": 0.9684026912534264, "support": 20065.0 }, "eval_O": { "f1-score": 0.9053591790193843, "precision": 0.9219017355169885, "recall": 0.8893998349251268, "support": 8481.0 }, "eval_accuracy": 0.9434335310478872, "eval_loss": 0.4996240735054016, "eval_macro avg": { "f1-score": 0.9220123288111223, "precision": 0.9216048514557116, "recall": 0.9227424122010879, "support": 29841.0 }, "eval_runtime": 4.6631, "eval_samples_per_second": 17.156, "eval_steps_per_second": 2.145, "eval_weighted avg": { "f1-score": 0.9431856481825407, "precision": 0.9431722960745722, "recall": 0.9434335310478872, "support": 29841.0 }, "step": 2187 }, { "epoch": 28.0, "eval_B": { "f1-score": 0.8919434898816342, "precision": 0.8821752265861027, "recall": 0.901930501930502, "support": 1295.0 }, "eval_I": { "f1-score": 0.9604717405427016, "precision": 0.9630706017938568, "recall": 0.9578868676800398, "support": 20065.0 }, "eval_O": { "f1-score": 0.9045243823719267, "precision": 0.9003504672897197, "recall": 0.9087371772196675, "support": 8481.0 }, "eval_accuracy": 0.9414898964511913, "eval_loss": 0.4974842071533203, "eval_macro avg": { "f1-score": 0.9189798709320876, "precision": 0.9151987652232264, "recall": 0.9228515156100698, "support": 29841.0 }, "eval_runtime": 4.6318, "eval_samples_per_second": 17.272, "eval_steps_per_second": 2.159, "eval_weighted avg": { "f1-score": 0.941597251442054, "precision": 0.9417345550251954, "recall": 0.9414898964511913, "support": 29841.0 }, "step": 2268 }, { "epoch": 29.0, "eval_B": { "f1-score": 0.9026415094339624, "precision": 0.8826568265682657, "recall": 0.9235521235521236, "support": 1295.0 }, "eval_I": { "f1-score": 0.963459587838005, "precision": 0.9565730005895068, "recall": 0.9704460503364066, "support": 20065.0 }, "eval_O": { "f1-score": 0.9098789958461262, "precision": 0.929520295202952, "recall": 0.8910505836575876, "support": 8481.0 }, "eval_accuracy": 0.9458463188230958, "eval_loss": 0.4864692687988281, "eval_macro avg": { "f1-score": 0.9253266977060312, "precision": 0.9229167074535748, "recall": 0.9283495858487059, "support": 29841.0 }, "eval_runtime": 4.6138, "eval_samples_per_second": 17.339, "eval_steps_per_second": 2.167, "eval_weighted avg": { "f1-score": 0.9455923443737659, "precision": 0.9456767357277099, "recall": 0.9458463188230958, "support": 29841.0 }, "step": 2349 }, { "epoch": 30.0, "eval_B": { "f1-score": 0.8974650018917897, "precision": 0.8798219584569733, "recall": 0.9158301158301159, "support": 1295.0 }, "eval_I": { "f1-score": 0.9618674357267865, "precision": 0.9515704252828716, "recall": 0.9723897333665587, "support": 20065.0 }, "eval_O": { "f1-score": 0.9045537340619307, "precision": 0.9324070597070973, "recall": 0.87831623629289, "support": 8481.0 }, "eval_accuracy": 0.9431989544586308, "eval_loss": 0.5332404375076294, "eval_macro avg": { "f1-score": 0.921295390560169, "precision": 0.9212664811489807, "recall": 0.9221786951631882, "support": 29841.0 }, "eval_runtime": 4.6482, "eval_samples_per_second": 17.211, "eval_steps_per_second": 2.151, "eval_weighted avg": { "f1-score": 0.9427836699134436, "precision": 0.9430104317173852, "recall": 0.9431989544586308, "support": 29841.0 }, "step": 2430 }, { "epoch": 30.86, "grad_norm": 0.05446575954556465, "learning_rate": 7.654320987654322e-06, "loss": 0.0008, "step": 2500 }, { "epoch": 31.0, "eval_B": { "f1-score": 0.9002674818494459, "precision": 0.8910741301059002, "recall": 0.9096525096525097, "support": 1295.0 }, "eval_I": { "f1-score": 0.9637251998815517, "precision": 0.9544454763184906, "recall": 0.9731871417891852, "support": 20065.0 }, "eval_O": { "f1-score": 0.9096185236684602, "precision": 0.9333746898263028, "recall": 0.8870416224501828, "support": 8481.0 }, "eval_accuracy": 0.9459468516470627, "eval_loss": 0.512050986289978, "eval_macro avg": { "f1-score": 0.9245370684664859, "precision": 0.9262980987502312, "recall": 0.9232937579639593, "support": 29841.0 }, "eval_runtime": 4.6554, "eval_samples_per_second": 17.184, "eval_steps_per_second": 2.148, "eval_weighted avg": { "f1-score": 0.9455938884035581, "precision": 0.945706920855016, "recall": 0.9459468516470627, "support": 29841.0 }, "step": 2511 }, { "epoch": 32.0, "eval_B": { "f1-score": 0.8938120702826584, "precision": 0.8843537414965986, "recall": 0.9034749034749034, "support": 1295.0 }, "eval_I": { "f1-score": 0.9597342259079783, "precision": 0.962041163803896, "recall": 0.9574383254423124, "support": 20065.0 }, "eval_O": { "f1-score": 0.903112155020552, "precision": 0.8995204117440636, "recall": 0.9067326966159651, "support": 8481.0 }, "eval_accuracy": 0.9406856338594551, "eval_loss": 0.5488592982292175, "eval_macro avg": { "f1-score": 0.9188861504037296, "precision": 0.9153051056815195, "recall": 0.9225486418443937, "support": 29841.0 }, "eval_runtime": 4.6459, "eval_samples_per_second": 17.22, "eval_steps_per_second": 2.152, "eval_weighted avg": { "f1-score": 0.9407810750507332, "precision": 0.9409009972509189, "recall": 0.9406856338594551, "support": 29841.0 }, "step": 2592 }, { "epoch": 33.0, "eval_B": { "f1-score": 0.9014084507042254, "precision": 0.8888888888888888, "recall": 0.9142857142857143, "support": 1295.0 }, "eval_I": { "f1-score": 0.963593310640817, "precision": 0.9538994969966303, "recall": 0.9734861699476701, "support": 20065.0 }, "eval_O": { "f1-score": 0.9089808030036942, "precision": 0.9343874501992032, "recall": 0.8849192312227332, "support": 8481.0 }, "eval_accuracy": 0.9457457859991287, "eval_loss": 0.518332839012146, "eval_macro avg": { "f1-score": 0.9246608547829123, "precision": 0.9257252786949075, "recall": 0.9242303718187058, "support": 29841.0 }, "eval_runtime": 4.6621, "eval_samples_per_second": 17.16, "eval_steps_per_second": 2.145, "eval_weighted avg": { "f1-score": 0.945373476490208, "precision": 0.9455328066582199, "recall": 0.9457457859991287, "support": 29841.0 }, "step": 2673 }, { "epoch": 34.0, "eval_B": { "f1-score": 0.9016641452344931, "precision": 0.8836174944403261, "recall": 0.9204633204633205, "support": 1295.0 }, "eval_I": { "f1-score": 0.9637216189536032, "precision": 0.9545343436812516, "recall": 0.9730874657363568, "support": 20065.0 }, "eval_O": { "f1-score": 0.9093110546070954, "precision": 0.934428269254697, "recall": 0.8855087843414692, "support": 8481.0 }, "eval_accuracy": 0.9459133407057404, "eval_loss": 0.5136498808860779, "eval_macro avg": { "f1-score": 0.9248989395983972, "precision": 0.9241933691254248, "recall": 0.9263531901803822, "support": 29841.0 }, "eval_runtime": 4.6341, "eval_samples_per_second": 17.263, "eval_steps_per_second": 2.158, "eval_weighted avg": { "f1-score": 0.9455647064946046, "precision": 0.9457425157606522, "recall": 0.9459133407057404, "support": 29841.0 }, "step": 2754 }, { "epoch": 35.0, "eval_B": { "f1-score": 0.9019157088122605, "precision": 0.8950570342205323, "recall": 0.9088803088803089, "support": 1295.0 }, "eval_I": { "f1-score": 0.9609330316066944, "precision": 0.9589537423069288, "recall": 0.9629205083478695, "support": 20065.0 }, "eval_O": { "f1-score": 0.90479862388042, "precision": 0.9103604678920983, "recall": 0.8993043273198915, "support": 8481.0 }, "eval_accuracy": 0.9424952246908616, "eval_loss": 0.5342629551887512, "eval_macro avg": { "f1-score": 0.922549121433125, "precision": 0.9214570814731865, "recall": 0.9237017148493566, "support": 29841.0 }, "eval_runtime": 4.6532, "eval_samples_per_second": 17.193, "eval_steps_per_second": 2.149, "eval_weighted avg": { "f1-score": 0.9424181244338341, "precision": 0.9423703236117087, "recall": 0.9424952246908616, "support": 29841.0 }, "step": 2835 }, { "epoch": 36.0, "eval_B": { "f1-score": 0.8977099236641222, "precision": 0.8875471698113208, "recall": 0.9081081081081082, "support": 1295.0 }, "eval_I": { "f1-score": 0.9619323959030825, "precision": 0.9573501826438938, "recall": 0.9665586842761027, "support": 20065.0 }, "eval_O": { "f1-score": 0.9061473206284726, "precision": 0.9183821748607411, "recall": 0.894234170498762, "support": 8481.0 }, "eval_accuracy": 0.9434670419892095, "eval_loss": 0.5332928895950317, "eval_macro avg": { "f1-score": 0.9219298800652257, "precision": 0.9210931757719852, "recall": 0.9229669876276576, "support": 29841.0 }, "eval_runtime": 4.6471, "eval_samples_per_second": 17.215, "eval_steps_per_second": 2.152, "eval_weighted avg": { "f1-score": 0.943290885063854, "precision": 0.9432460113484581, "recall": 0.9434670419892095, "support": 29841.0 }, "step": 2916 }, { "epoch": 37.0, "eval_B": { "f1-score": 0.8917982287254526, "precision": 0.8894009216589862, "recall": 0.8942084942084942, "support": 1295.0 }, "eval_I": { "f1-score": 0.9575175655739755, "precision": 0.9608089120835006, "recall": 0.9542486917518066, "support": 20065.0 }, "eval_O": { "f1-score": 0.8977299321319915, "precision": 0.8909534316571827, "recall": 0.9046103053885155, "support": 8481.0 }, "eval_accuracy": 0.937535605375155, "eval_loss": 0.5845798254013062, "eval_macro avg": { "f1-score": 0.9156819088104732, "precision": 0.9137210884665565, "recall": 0.9176891637829389, "support": 29841.0 }, "eval_runtime": 4.6742, "eval_samples_per_second": 17.115, "eval_steps_per_second": 2.139, "eval_weighted avg": { "f1-score": 0.937673543576043, "precision": 0.9378566759957238, "recall": 0.937535605375155, "support": 29841.0 }, "step": 2997 }, { "epoch": 37.04, "grad_norm": 0.020925017073750496, "learning_rate": 5.185185185185185e-06, "loss": 0.0006, "step": 3000 }, { "epoch": 38.0, "eval_B": { "f1-score": 0.8994994224104735, "precision": 0.8970814132104454, "recall": 0.901930501930502, "support": 1295.0 }, "eval_I": { "f1-score": 0.9628343174713442, "precision": 0.9586482881280569, "recall": 0.9670570645402442, "support": 20065.0 }, "eval_O": { "f1-score": 0.9081590082841646, "precision": 0.918173053747891, "recall": 0.8983610423299139, "support": 8481.0 }, "eval_accuracy": 0.9447069468181362, "eval_loss": 0.5537129640579224, "eval_macro avg": { "f1-score": 0.9234975827219941, "precision": 0.9246342516954645, "recall": 0.9224495362668866, "support": 29841.0 }, "eval_runtime": 4.6513, "eval_samples_per_second": 17.2, "eval_steps_per_second": 2.15, "eval_weighted avg": { "f1-score": 0.9445467270313357, "precision": 0.9444731744992745, "recall": 0.9447069468181362, "support": 29841.0 }, "step": 3078 }, { "epoch": 39.0, "eval_B": { "f1-score": 0.8977536793183579, "precision": 0.9005439005439005, "recall": 0.894980694980695, "support": 1295.0 }, "eval_I": { "f1-score": 0.9618782884939938, "precision": 0.9580264003559599, "recall": 0.9657612758534762, "support": 20065.0 }, "eval_O": { "f1-score": 0.9058781532603523, "precision": 0.914254833673592, "recall": 0.8976535785874308, "support": 8481.0 }, "eval_accuracy": 0.9433329982239201, "eval_loss": 0.5526662468910217, "eval_macro avg": { "f1-score": 0.9218367070242347, "precision": 0.9242750448578175, "recall": 0.919465183140534, "support": 29841.0 }, "eval_runtime": 4.6395, "eval_samples_per_second": 17.243, "eval_steps_per_second": 2.155, "eval_weighted avg": { "f1-score": 0.9431799031919275, "precision": 0.9430916966164814, "recall": 0.9433329982239201, "support": 29841.0 }, "step": 3159 }, { "epoch": 40.0, "eval_B": { "f1-score": 0.9007981755986316, "precision": 0.8869760479041916, "recall": 0.915057915057915, "support": 1295.0 }, "eval_I": { "f1-score": 0.9632649027891005, "precision": 0.9550308611737043, "recall": 0.9716421629703463, "support": 20065.0 }, "eval_O": { "f1-score": 0.908520395848419, "precision": 0.9304165121740205, "recall": 0.8876311755689188, "support": 8481.0 }, "eval_accuracy": 0.9453101437619382, "eval_loss": 0.5522081851959229, "eval_macro avg": { "f1-score": 0.9241944914120505, "precision": 0.9241411404173054, "recall": 0.9247770845323934, "support": 29841.0 }, "eval_runtime": 4.6584, "eval_samples_per_second": 17.173, "eval_steps_per_second": 2.147, "eval_weighted avg": { "f1-score": 0.9449953215057797, "precision": 0.9450819560750032, "recall": 0.9453101437619382, "support": 29841.0 }, "step": 3240 }, { "epoch": 41.0, "eval_B": { "f1-score": 0.8909299655568312, "precision": 0.8831562974203339, "recall": 0.8988416988416988, "support": 1295.0 }, "eval_I": { "f1-score": 0.9586475553113918, "precision": 0.9606626294980232, "recall": 0.956640917019686, "support": 20065.0 }, "eval_O": { "f1-score": 0.900311343476473, "precision": 0.897096698665418, "recall": 0.9035491097747907, "support": 8481.0 }, "eval_accuracy": 0.9390435977346604, "eval_loss": 0.5731642246246338, "eval_macro avg": { "f1-score": 0.916629621448232, "precision": 0.9136385418612583, "recall": 0.9196772418787251, "support": 29841.0 }, "eval_runtime": 4.6541, "eval_samples_per_second": 17.189, "eval_steps_per_second": 2.149, "eval_weighted avg": { "f1-score": 0.9391293189485319, "precision": 0.9392332752728989, "recall": 0.9390435977346604, "support": 29841.0 }, "step": 3321 }, { "epoch": 42.0, "eval_B": { "f1-score": 0.8967889908256882, "precision": 0.8879636638909917, "recall": 0.9057915057915058, "support": 1295.0 }, "eval_I": { "f1-score": 0.9603067881866627, "precision": 0.9596376847658389, "recall": 0.9609768253177174, "support": 20065.0 }, "eval_O": { "f1-score": 0.9034776437189497, "precision": 0.906372374510502, "recall": 0.9006013441811107, "support": 8481.0 }, "eval_accuracy": 0.9414228745685467, "eval_loss": 0.554601788520813, "eval_macro avg": { "f1-score": 0.9201911409104335, "precision": 0.9179912410557775, "recall": 0.9224565584301113, "support": 29841.0 }, "eval_runtime": 4.6491, "eval_samples_per_second": 17.208, "eval_steps_per_second": 2.151, "eval_weighted avg": { "f1-score": 0.9413991268544976, "precision": 0.9413889346130814, "recall": 0.9414228745685467, "support": 29841.0 }, "step": 3402 }, { "epoch": 43.0, "eval_B": { "f1-score": 0.8997331300038124, "precision": 0.8885542168674698, "recall": 0.9111969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.9637457002152986, "precision": 0.957137239480928, "recall": 0.9704460503364066, "support": 20065.0 }, "eval_O": { "f1-score": 0.9099099099099098, "precision": 0.9272860815277267, "recall": 0.8931729748850371, "support": 8481.0 }, "eval_accuracy": 0.9459133407057404, "eval_loss": 0.5374415516853333, "eval_macro avg": { "f1-score": 0.9244629133763403, "precision": 0.9243258459587081, "recall": 0.9249386454727849, "support": 29841.0 }, "eval_runtime": 4.6464, "eval_samples_per_second": 17.218, "eval_steps_per_second": 2.152, "eval_weighted avg": { "f1-score": 0.9456672974806759, "precision": 0.9456770777944722, "recall": 0.9459133407057404, "support": 29841.0 }, "step": 3483 }, { "epoch": 43.21, "grad_norm": 0.08381267637014389, "learning_rate": 2.7160493827160496e-06, "loss": 0.0002, "step": 3500 }, { "epoch": 44.0, "eval_B": { "f1-score": 0.9002284843869003, "precision": 0.8880540946656649, "recall": 0.9127413127413128, "support": 1295.0 }, "eval_I": { "f1-score": 0.963930040132785, "precision": 0.9583271760011822, "recall": 0.9695988038873661, "support": 20065.0 }, "eval_O": { "f1-score": 0.910844817255842, "precision": 0.9259349494457303, "recall": 0.8962386511024644, "support": 8481.0 }, "eval_accuracy": 0.9462819610602862, "eval_loss": 0.5376068353652954, "eval_macro avg": { "f1-score": 0.9250011139251758, "precision": 0.9241054067041925, "recall": 0.9261929225770477, "support": 29841.0 }, "eval_runtime": 4.6695, "eval_samples_per_second": 17.132, "eval_steps_per_second": 2.142, "eval_weighted avg": { "f1-score": 0.9460784503767355, "precision": 0.9460714837071478, "recall": 0.9462819610602862, "support": 29841.0 }, "step": 3564 }, { "epoch": 45.0, "eval_B": { "f1-score": 0.9023185100722159, "precision": 0.8884730538922155, "recall": 0.9166023166023166, "support": 1295.0 }, "eval_I": { "f1-score": 0.9641558441558441, "precision": 0.9571709233791749, "recall": 0.9712434587590332, "support": 20065.0 }, "eval_O": { "f1-score": 0.9111030915433657, "precision": 0.9298956414978514, "recall": 0.8930550642612899, "support": 8481.0 }, "eval_accuracy": 0.9466505814148319, "eval_loss": 0.5380018949508667, "eval_macro avg": { "f1-score": 0.9258591485904751, "precision": 0.9251798729230806, "recall": 0.92696694654088, "support": 29841.0 }, "eval_runtime": 4.6294, "eval_samples_per_second": 17.281, "eval_steps_per_second": 2.16, "eval_weighted avg": { "f1-score": 0.9463943836637451, "precision": 0.9464378579114923, "recall": 0.9466505814148319, "support": 29841.0 }, "step": 3645 }, { "epoch": 46.0, "eval_B": { "f1-score": 0.9017517136329019, "precision": 0.8895567242674681, "recall": 0.9142857142857143, "support": 1295.0 }, "eval_I": { "f1-score": 0.9637677572637727, "precision": 0.9572292414335578, "recall": 0.9703962123099925, "support": 20065.0 }, "eval_O": { "f1-score": 0.9103903903903904, "precision": 0.927775737544375, "recall": 0.893644617380026, "support": 8481.0 }, "eval_accuracy": 0.9461479172949968, "eval_loss": 0.5362712144851685, "eval_macro avg": { "f1-score": 0.9253032870956882, "precision": 0.9248539010818003, "recall": 0.926108847991911, "support": 29841.0 }, "eval_runtime": 4.6532, "eval_samples_per_second": 17.193, "eval_steps_per_second": 2.149, "eval_weighted avg": { "f1-score": 0.9459062839567411, "precision": 0.9459216084382076, "recall": 0.9461479172949968, "support": 29841.0 }, "step": 3726 }, { "epoch": 47.0, "eval_B": { "f1-score": 0.9013333333333334, "precision": 0.8894736842105263, "recall": 0.9135135135135135, "support": 1295.0 }, "eval_I": { "f1-score": 0.9637367261565881, "precision": 0.9573620537031573, "recall": 0.9701968602043359, "support": 20065.0 }, "eval_O": { "f1-score": 0.9103133629487334, "precision": 0.9272349272349273, "recall": 0.8939983492512675, "support": 8481.0 }, "eval_accuracy": 0.9460808954123522, "eval_loss": 0.5367923974990845, "eval_macro avg": { "f1-score": 0.9251278074795518, "precision": 0.9246902217162036, "recall": 0.9259029076563724, "support": 29841.0 }, "eval_runtime": 4.6611, "eval_samples_per_second": 17.164, "eval_steps_per_second": 2.145, "eval_weighted avg": { "f1-score": 0.9458453707371339, "precision": 0.9458536056595257, "recall": 0.9460808954123522, "support": 29841.0 }, "step": 3807 }, { "epoch": 48.0, "eval_B": { "f1-score": 0.9012158054711246, "precision": 0.887060583395662, "recall": 0.9158301158301159, "support": 1295.0 }, "eval_I": { "f1-score": 0.9645930175056869, "precision": 0.957161784189607, "recall": 0.972140543234488, "support": 20065.0 }, "eval_O": { "f1-score": 0.9119595326990244, "precision": 0.9319384615384615, "recall": 0.8928192430137956, "support": 8481.0 }, "eval_accuracy": 0.9471532455346671, "eval_loss": 0.5329636931419373, "eval_macro avg": { "f1-score": 0.9259227852252786, "precision": 0.9253869430412435, "recall": 0.9269299673594665, "support": 29841.0 }, "eval_runtime": 4.6306, "eval_samples_per_second": 17.276, "eval_steps_per_second": 2.16, "eval_weighted avg": { "f1-score": 0.9468838899888457, "precision": 0.9469509985446042, "recall": 0.9471532455346671, "support": 29841.0 }, "step": 3888 }, { "epoch": 49.0, "eval_B": { "f1-score": 0.9007981755986316, "precision": 0.8869760479041916, "recall": 0.915057915057915, "support": 1295.0 }, "eval_I": { "f1-score": 0.9646663205004574, "precision": 0.9572578270684071, "recall": 0.9721903812609021, "support": 20065.0 }, "eval_O": { "f1-score": 0.9120905587668594, "precision": 0.9319552110249785, "recall": 0.8930550642612899, "support": 8481.0 }, "eval_accuracy": 0.9472202674173118, "eval_loss": 0.5337651371955872, "eval_macro avg": { "f1-score": 0.9258516849553162, "precision": 0.9253963619991925, "recall": 0.9267677868600357, "support": 29841.0 }, "eval_runtime": 4.6446, "eval_samples_per_second": 17.224, "eval_steps_per_second": 2.153, "eval_weighted avg": { "f1-score": 0.9469522933931048, "precision": 0.9470166692425308, "recall": 0.9472202674173118, "support": 29841.0 }, "step": 3969 } ], "logging_steps": 500, "max_steps": 4050, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "total_flos": 7045545984044400.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }