{ "best_metric": null, "best_model_checkpoint": null, "epoch": 10.0, "eval_steps": 500, "global_step": 810, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_Claim": { "f1-score": 0.38183790485045715, "precision": 0.6497890295358649, "recall": 0.27035330261136714, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.6266258607498087, "precision": 0.5535653937140926, "recall": 0.7219039224327898, "support": 2269.0 }, "eval_O": { "f1-score": 0.8545803971812939, "precision": 0.8443037974683544, "recall": 0.8651102464332037, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.878949075575738, "precision": 0.8314310260186549, "recall": 0.9322278794550709, "support": 14534.0 }, "eval_accuracy": 0.7960859220535504, "eval_loss": 0.5359914898872375, "eval_macro avg": { "f1-score": 0.6854983095893245, "precision": 0.7197723116842417, "recall": 0.697398837733108, "support": 29841.0 }, "eval_runtime": 4.8191, "eval_samples_per_second": 16.601, "eval_steps_per_second": 2.075, "eval_weighted avg": { "f1-score": 0.7769240850962494, "precision": 0.7862232339538372, "recall": 0.7960859220535504, "support": 29841.0 }, "step": 81 }, { "epoch": 2.0, "eval_Claim": { "f1-score": 0.6161300742974051, "precision": 0.6048625792811839, "recall": 0.6278253236778583, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.7920215150156881, "precision": 0.8057455540355677, "recall": 0.7787571617452622, "support": 2269.0 }, "eval_O": { "f1-score": 0.8922796352583586, "precision": 0.9209436566695947, "recall": 0.865346067680698, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8914289590611538, "precision": 0.8790554552143957, "recall": 0.9041557726709784, "support": 14534.0 }, "eval_accuracy": 0.8413927147213566, "eval_loss": 0.443877637386322, "eval_macro avg": { "f1-score": 0.7979650459081514, "precision": 0.8026518113001855, "recall": 0.7940210814436992, "support": 29841.0 }, "eval_runtime": 4.8087, "eval_samples_per_second": 16.637, "eval_steps_per_second": 2.08, "eval_weighted avg": { "f1-score": 0.842071433389123, "precision": 0.8435143116581857, "recall": 0.8413927147213566, "support": 29841.0 }, "step": 162 }, { "epoch": 3.0, "eval_Claim": { "f1-score": 0.6042799305957202, "precision": 0.6389432485322897, "recall": 0.5731841123546193, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8349557522123894, "precision": 0.8382940915148823, "recall": 0.8316438959894227, "support": 2269.0 }, "eval_O": { "f1-score": 0.8941106484235574, "precision": 0.9022691799735862, "recall": 0.8860983374602052, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8917763490086511, "precision": 0.8729980887102089, "recall": 0.9113802119168846, "support": 14534.0 }, "eval_accuracy": 0.8464863778023525, "eval_loss": 0.4555923044681549, "eval_macro avg": { "f1-score": 0.8062806700600795, "precision": 0.8131261521827418, "recall": 0.8005766394302829, "support": 29841.0 }, "eval_runtime": 4.7811, "eval_samples_per_second": 16.733, "eval_steps_per_second": 2.092, "eval_weighted avg": { "f1-score": 0.8442159482345275, "precision": 0.8429359878649869, "recall": 0.8464863778023525, "support": 29841.0 }, "step": 243 }, { "epoch": 4.0, "eval_Claim": { "f1-score": 0.6278026905829596, "precision": 0.5981717011128775, "recall": 0.6605222734254992, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8182207014542344, "precision": 0.7947652679684254, "recall": 0.8431026884089907, "support": 2269.0 }, "eval_O": { "f1-score": 0.9069328626209752, "precision": 0.9373427277302466, "recall": 0.8784341469166372, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.888919552918449, "precision": 0.8913795489137954, "recall": 0.8864730975643319, "support": 14534.0 }, "eval_accuracy": 0.8463858449783854, "eval_loss": 0.4377317428588867, "eval_macro avg": { "f1-score": 0.8104689518941546, "precision": 0.8054148114313363, "recall": 0.8171330515788647, "support": 29841.0 }, "eval_runtime": 4.8109, "eval_samples_per_second": 16.629, "eval_steps_per_second": 2.079, "eval_weighted avg": { "f1-score": 0.8487883791626096, "precision": 0.8523207959781866, "recall": 0.8463858449783854, "support": 29841.0 }, "step": 324 }, { "epoch": 5.0, "eval_Claim": { "f1-score": 0.6247990569070839, "precision": 0.6105990783410138, "recall": 0.6396752249286811, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.7998289136013687, "precision": 0.7769007062733694, "recall": 0.8241516086381666, "support": 2269.0 }, "eval_O": { "f1-score": 0.9028039585296891, "precision": 0.9020600353148911, "recall": 0.9035491097747907, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8885327014878567, "precision": 0.9001058948111542, "recall": 0.8772533370028898, "support": 14534.0 }, "eval_accuracy": 0.8444086994403672, "eval_loss": 0.5236712694168091, "eval_macro avg": { "f1-score": 0.8039911576314996, "precision": 0.7974164286851071, "recall": 0.8111573200861321, "support": 29841.0 }, "eval_runtime": 4.8153, "eval_samples_per_second": 16.614, "eval_steps_per_second": 2.077, "eval_weighted avg": { "f1-score": 0.8455693764619782, "precision": 0.8470828034323642, "recall": 0.8444086994403672, "support": 29841.0 }, "step": 405 }, { "epoch": 6.0, "eval_Claim": { "f1-score": 0.6166529266281945, "precision": 0.5813095006800078, "recall": 0.6565723063418916, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8074107959743824, "precision": 0.8392772230147408, "recall": 0.7778757161745262, "support": 2269.0 }, "eval_O": { "f1-score": 0.8913107165875667, "precision": 0.8858607034707664, "recall": 0.8968282042212004, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8815305371596762, "precision": 0.8981792217065334, "recall": 0.865487821659557, "support": 14534.0 }, "eval_accuracy": 0.8358298984618477, "eval_loss": 0.5537309050559998, "eval_macro avg": { "f1-score": 0.7992262440874549, "precision": 0.8011566622180121, "recall": 0.7991910120992938, "support": 29841.0 }, "eval_runtime": 4.7996, "eval_samples_per_second": 16.668, "eval_steps_per_second": 2.084, "eval_weighted avg": { "f1-score": 0.838225042631562, "precision": 0.8418105575563007, "recall": 0.8358298984618477, "support": 29841.0 }, "step": 486 }, { "epoch": 6.17, "grad_norm": 6.804128646850586, "learning_rate": 1.7530864197530865e-05, "loss": 0.3426, "step": 500 }, { "epoch": 7.0, "eval_Claim": { "f1-score": 0.6206536493682782, "precision": 0.5920318725099601, "recall": 0.652183454026772, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8364370652905541, "precision": 0.8519195612431444, "recall": 0.8215072719259586, "support": 2269.0 }, "eval_O": { "f1-score": 0.9008658773634918, "precision": 0.9000706214689266, "recall": 0.9016625397948355, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8854242963272995, "precision": 0.8978566881233642, "recall": 0.8733314985551122, "support": 14534.0 }, "eval_accuracy": 0.8436714587312758, "eval_loss": 0.5738794207572937, "eval_macro avg": { "f1-score": 0.8108452220874058, "precision": 0.8104696858363488, "recall": 0.8121711910756696, "support": 29841.0 }, "eval_runtime": 4.8167, "eval_samples_per_second": 16.609, "eval_steps_per_second": 2.076, "eval_weighted avg": { "f1-score": 0.8456551258354699, "precision": 0.8482906998207675, "recall": 0.8436714587312758, "support": 29841.0 }, "step": 567 }, { "epoch": 8.0, "eval_Claim": { "f1-score": 0.6410105757931845, "precision": 0.5787798408488064, "recall": 0.7182356813693219, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8115942028985507, "precision": 0.8804123711340206, "recall": 0.75275451740855, "support": 2269.0 }, "eval_O": { "f1-score": 0.8960937967338637, "precision": 0.9094220495386109, "recall": 0.8831505718665251, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.891816143497758, "precision": 0.9084939329050679, "recall": 0.8757396449704142, "support": 14534.0 }, "eval_accuracy": 0.8444422103816897, "eval_loss": 0.5891872644424438, "eval_macro avg": { "f1-score": 0.8101286797308392, "precision": 0.8192770486066265, "recall": 0.8074701039037029, "support": 29841.0 }, "eval_runtime": 4.799, "eval_samples_per_second": 16.67, "eval_steps_per_second": 2.084, "eval_weighted avg": { "f1-score": 0.8486317402219317, "precision": 0.8562720628608399, "recall": 0.8444422103816897, "support": 29841.0 }, "step": 648 }, { "epoch": 9.0, "eval_Claim": { "f1-score": 0.6284997910572503, "precision": 0.5998005982053839, "recall": 0.6600833881939873, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.816712834718375, "precision": 0.857489093553078, "recall": 0.7796386073159982, "support": 2269.0 }, "eval_O": { "f1-score": 0.8971996170416466, "precision": 0.9108249301421455, "recall": 0.8839759462327555, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8942406935938898, "precision": 0.8943022295623452, "recall": 0.8941791660932985, "support": 14534.0 }, "eval_accuracy": 0.8468214872155759, "eval_loss": 0.7009620070457458, "eval_macro avg": { "f1-score": 0.8091632341027905, "precision": 0.8156042128657381, "recall": 0.8044692769590099, "support": 29841.0 }, "eval_runtime": 4.8005, "eval_samples_per_second": 16.665, "eval_steps_per_second": 2.083, "eval_weighted avg": { "f1-score": 0.848605581671113, "precision": 0.8512257939173797, "recall": 0.8468214872155759, "support": 29841.0 }, "step": 729 }, { "epoch": 10.0, "eval_Claim": { "f1-score": 0.6189745836985101, "precision": 0.6180266900021877, "recall": 0.619925389510643, "support": 4557.0 }, "eval_MajorClaim": { "f1-score": 0.8208921766420085, "precision": 0.8353102189781022, "recall": 0.8069634200088145, "support": 2269.0 }, "eval_O": { "f1-score": 0.8951902368987796, "precision": 0.9085610200364299, "recall": 0.8822072868765476, "support": 8481.0 }, "eval_Premise": { "f1-score": 0.8963474827245805, "precision": 0.8870174493027017, "recall": 0.905875877253337, "support": 14534.0 }, "eval_accuracy": 0.8479608592205355, "eval_loss": 0.7416248917579651, "eval_macro avg": { "f1-score": 0.8078511199909697, "precision": 0.8122288445798553, "recall": 0.8037429934123356, "support": 29841.0 }, "eval_runtime": 4.7804, "eval_samples_per_second": 16.735, "eval_steps_per_second": 2.092, "eval_weighted avg": { "f1-score": 0.8479238041544329, "precision": 0.8481312332795722, "recall": 0.8479608592205355, "support": 29841.0 }, "step": 810 } ], "logging_steps": 500, "max_steps": 4050, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "total_flos": 1437887327268000.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }