diff --git "a/checkpoint-3888/trainer_state.json" "b/checkpoint-3888/trainer_state.json" --- "a/checkpoint-3888/trainer_state.json" +++ "b/checkpoint-3888/trainer_state.json" @@ -11,2209 +11,2209 @@ { "epoch": 1.0, "eval_Claim": { - "f1-score": 0.44734338904742493, - "precision": 0.5477537437603993, - "recall": 0.3780431786862655, - "support": 4354.0 + "f1-score": 0.38183790485045715, + "precision": 0.6497890295358649, + "recall": 0.27035330261136714, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.6504965622612681, - "precision": 0.5898856944925528, - "recall": 0.7249893571732652, - "support": 2349.0 + "f1-score": 0.6266258607498087, + "precision": 0.5535653937140926, + "recall": 0.7219039224327898, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.8859784283513097, - "precision": 0.8689081979599547, - "recall": 0.9037328094302554, - "support": 10180.0 + "f1-score": 0.8545803971812939, + "precision": 0.8443037974683544, + "recall": 0.8651102464332037, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8720120805863504, - "precision": 0.859258183929738, - "recall": 0.8851502916105877, - "support": 13374.0 + "f1-score": 0.878949075575738, + "precision": 0.8314310260186549, + "recall": 0.9322278794550709, + "support": 14534.0 }, - "eval_accuracy": 0.8059953068711373, - "eval_loss": 0.47828415036201477, + "eval_accuracy": 0.7960859220535504, + "eval_loss": 0.5359914898872375, "eval_macro avg": { - "f1-score": 0.7139576150615883, - "precision": 0.7164514550356611, - "recall": 0.7229789092250934, - "support": 30257.0 - }, - "eval_runtime": 4.8422, - "eval_samples_per_second": 16.728, - "eval_steps_per_second": 2.272, + "f1-score": 0.6854983095893245, + "precision": 0.7197723116842417, + "recall": 0.697398837733108, + "support": 29841.0 + }, + "eval_runtime": 4.8191, + "eval_samples_per_second": 16.601, + "eval_steps_per_second": 2.075, "eval_weighted avg": { - "f1-score": 0.7984036588902531, - "precision": 0.7967665566250599, - "recall": 0.8059953068711373, - "support": 30257.0 + "f1-score": 0.7769240850962494, + "precision": 0.7862232339538372, + "recall": 0.7960859220535504, + "support": 29841.0 }, "step": 81 }, { "epoch": 2.0, "eval_Claim": { - "f1-score": 0.5787561000934482, - "precision": 0.5281409891984082, - "recall": 0.6401010564997703, - "support": 4354.0 + "f1-score": 0.6161300742974051, + "precision": 0.6048625792811839, + "recall": 0.6278253236778583, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7702650787552824, - "precision": 0.7017850892544627, - "recall": 0.8535547041294168, - "support": 2349.0 + "f1-score": 0.7920215150156881, + "precision": 0.8057455540355677, + "recall": 0.7787571617452622, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9095337508698677, - "precision": 0.9206077681626081, - "recall": 0.8987229862475442, - "support": 10180.0 + "f1-score": 0.8922796352583586, + "precision": 0.9209436566695947, + "recall": 0.865346067680698, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8736648538675224, - "precision": 0.9162905211325401, - "recall": 0.8348287722446538, - "support": 13374.0 + "f1-score": 0.8914289590611538, + "precision": 0.8790554552143957, + "recall": 0.9041557726709784, + "support": 14534.0 }, - "eval_accuracy": 0.8297584030141786, - "eval_loss": 0.4241589605808258, + "eval_accuracy": 0.8413927147213566, + "eval_loss": 0.443877637386322, "eval_macro avg": { - "f1-score": 0.7830549458965301, - "precision": 0.7667060919370048, - "recall": 0.8068018797803463, - "support": 30257.0 - }, - "eval_runtime": 4.8636, - "eval_samples_per_second": 16.654, - "eval_steps_per_second": 2.262, + "f1-score": 0.7979650459081514, + "precision": 0.8026518113001855, + "recall": 0.7940210814436992, + "support": 29841.0 + }, + "eval_runtime": 4.8087, + "eval_samples_per_second": 16.637, + "eval_steps_per_second": 2.08, "eval_weighted avg": { - "f1-score": 0.8352680063880269, - "precision": 0.8452350051608073, - "recall": 0.8297584030141786, - "support": 30257.0 + "f1-score": 0.842071433389123, + "precision": 0.8435143116581857, + "recall": 0.8413927147213566, + "support": 29841.0 }, "step": 162 }, { "epoch": 3.0, "eval_Claim": { - "f1-score": 0.5728465083303793, - "precision": 0.5899245558530056, - "recall": 0.5567294441892513, - "support": 4354.0 + "f1-score": 0.6042799305957202, + "precision": 0.6389432485322897, + "recall": 0.5731841123546193, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7862876979822088, - "precision": 0.8017699115044248, - "recall": 0.7713920817369093, - "support": 2349.0 + "f1-score": 0.8349557522123894, + "precision": 0.8382940915148823, + "recall": 0.8316438959894227, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.914532821534425, - "precision": 0.9048168445341794, - "recall": 0.9244597249508841, - "support": 10180.0 + "f1-score": 0.8941106484235574, + "precision": 0.9022691799735862, + "recall": 0.8860983374602052, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8880533114924986, - "precision": 0.8843330614665975, - "recall": 0.8918049947659639, - "support": 13374.0 + "f1-score": 0.8917763490086511, + "precision": 0.8729980887102089, + "recall": 0.9113802119168846, + "support": 14534.0 }, - "eval_accuracy": 0.8452258981392735, - "eval_loss": 0.41067537665367126, + "eval_accuracy": 0.8464863778023525, + "eval_loss": 0.4555923044681549, "eval_macro avg": { - "f1-score": 0.7904300848348779, - "precision": 0.7952110933395518, - "recall": 0.7860965614107521, - "support": 30257.0 - }, - "eval_runtime": 4.8684, - "eval_samples_per_second": 16.638, - "eval_steps_per_second": 2.259, + "f1-score": 0.8062806700600795, + "precision": 0.8131261521827418, + "recall": 0.8005766394302829, + "support": 29841.0 + }, + "eval_runtime": 4.7811, + "eval_samples_per_second": 16.733, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8437033615676307, - "precision": 0.8424495118392472, - "recall": 0.8452258981392735, - "support": 30257.0 + "f1-score": 0.8442159482345275, + "precision": 0.8429359878649869, + "recall": 0.8464863778023525, + "support": 29841.0 }, "step": 243 }, { "epoch": 4.0, "eval_Claim": { - "f1-score": 0.5865384615384616, - "precision": 0.5714596949891068, - "recall": 0.6024345429490124, - "support": 4354.0 + "f1-score": 0.6278026905829596, + "precision": 0.5981717011128775, + "recall": 0.6605222734254992, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7783630470016208, - "precision": 0.7425589485890993, - "recall": 0.8177948063005535, - "support": 2349.0 + "f1-score": 0.8182207014542344, + "precision": 0.7947652679684254, + "recall": 0.8431026884089907, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9108591535529275, - "precision": 0.9063411787589963, - "recall": 0.9154223968565816, - "support": 10180.0 + "f1-score": 0.9069328626209752, + "precision": 0.9373427277302466, + "recall": 0.8784341469166372, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8868256151612411, - "precision": 0.9067823097358962, - "recall": 0.8677284282937042, - "support": 13374.0 + "f1-score": 0.888919552918449, + "precision": 0.8913795489137954, + "recall": 0.8864730975643319, + "support": 14534.0 }, - "eval_accuracy": 0.8417225765938461, - "eval_loss": 0.4545813202857971, + "eval_accuracy": 0.8463858449783854, + "eval_loss": 0.4377317428588867, "eval_macro avg": { - "f1-score": 0.7906465693135627, - "precision": 0.7817855330182747, - "recall": 0.8008450435999629, - "support": 30257.0 - }, - "eval_runtime": 4.9112, - "eval_samples_per_second": 16.493, - "eval_steps_per_second": 2.24, + "f1-score": 0.8104689518941546, + "precision": 0.8054148114313363, + "recall": 0.8171330515788647, + "support": 29841.0 + }, + "eval_runtime": 4.8109, + "eval_samples_per_second": 16.629, + "eval_steps_per_second": 2.079, "eval_weighted avg": { - "f1-score": 0.8432797441676475, - "precision": 0.8456313015960876, - "recall": 0.8417225765938461, - "support": 30257.0 + "f1-score": 0.8487883791626096, + "precision": 0.8523207959781866, + "recall": 0.8463858449783854, + "support": 29841.0 }, "step": 324 }, { "epoch": 5.0, "eval_Claim": { - "f1-score": 0.597399608790703, - "precision": 0.5985704403965875, - "recall": 0.5962333486449242, - "support": 4354.0 + "f1-score": 0.6247990569070839, + "precision": 0.6105990783410138, + "recall": 0.6396752249286811, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7933532168726033, - "precision": 0.7940298507462686, - "recall": 0.7926777352064709, - "support": 2349.0 + "f1-score": 0.7998289136013687, + "precision": 0.7769007062733694, + "recall": 0.8241516086381666, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9101112629318758, - "precision": 0.9042862684251358, - "recall": 0.9160117878192534, - "support": 10180.0 + "f1-score": 0.9028039585296891, + "precision": 0.9020600353148911, + "recall": 0.9035491097747907, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8923677591320345, - "precision": 0.8961019377214808, - "recall": 0.8886645730521908, - "support": 13374.0 + "f1-score": 0.8885327014878567, + "precision": 0.9001058948111542, + "recall": 0.8772533370028898, + "support": 14534.0 }, - "eval_accuracy": 0.848332617245596, - "eval_loss": 0.48704993724823, + "eval_accuracy": 0.8444086994403672, + "eval_loss": 0.5236712694168091, "eval_macro avg": { - "f1-score": 0.7983079619318041, - "precision": 0.7982471243223681, - "recall": 0.7983968611807098, - "support": 30257.0 - }, - "eval_runtime": 4.8769, - "eval_samples_per_second": 16.609, - "eval_steps_per_second": 2.256, + "f1-score": 0.8039911576314996, + "precision": 0.7974164286851071, + "recall": 0.8111573200861321, + "support": 29841.0 + }, + "eval_runtime": 4.8153, + "eval_samples_per_second": 16.614, + "eval_steps_per_second": 2.077, "eval_weighted avg": { - "f1-score": 0.8482045037639816, - "precision": 0.8481162489521332, - "recall": 0.848332617245596, - "support": 30257.0 + "f1-score": 0.8455693764619782, + "precision": 0.8470828034323642, + "recall": 0.8444086994403672, + "support": 29841.0 }, "step": 405 }, { "epoch": 6.0, "eval_Claim": { - "f1-score": 0.6060809300245921, - "precision": 0.5903745644599303, - "recall": 0.6226458429030777, - "support": 4354.0 + "f1-score": 0.6166529266281945, + "precision": 0.5813095006800078, + "recall": 0.6565723063418916, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7858529221479404, - "precision": 0.7963286713286714, - "recall": 0.7756492124308216, - "support": 2349.0 + "f1-score": 0.8074107959743824, + "precision": 0.8392772230147408, + "recall": 0.7778757161745262, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9135615470059578, - "precision": 0.9398504051527115, - "recall": 0.8887033398821218, - "support": 10180.0 + "f1-score": 0.8913107165875667, + "precision": 0.8858607034707664, + "recall": 0.8968282042212004, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.895557603686636, - "precision": 0.88328121591157, - "recall": 0.908180050844923, - "support": 13374.0 + "f1-score": 0.8815305371596762, + "precision": 0.8981792217065334, + "recall": 0.865487821659557, + "support": 14534.0 }, - "eval_accuracy": 0.8502495290346036, - "eval_loss": 0.5423789024353027, + "eval_accuracy": 0.8358298984618477, + "eval_loss": 0.5537309050559998, "eval_macro avg": { - "f1-score": 0.8002632507162816, - "precision": 0.8024587142132208, - "recall": 0.7987946115152361, - "support": 30257.0 - }, - "eval_runtime": 4.867, - "eval_samples_per_second": 16.643, - "eval_steps_per_second": 2.26, + "f1-score": 0.7992262440874549, + "precision": 0.8011566622180121, + "recall": 0.7991910120992938, + "support": 29841.0 + }, + "eval_runtime": 4.7996, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 2.084, "eval_weighted avg": { - "f1-score": 0.8514422719925407, - "precision": 0.8534139871324166, - "recall": 0.8502495290346036, - "support": 30257.0 + "f1-score": 0.838225042631562, + "precision": 0.8418105575563007, + "recall": 0.8358298984618477, + "support": 29841.0 }, "step": 486 }, { "epoch": 6.17, - "grad_norm": 4.494631767272949, + "grad_norm": 6.804128646850586, "learning_rate": 1.7530864197530865e-05, - "loss": 0.35, + "loss": 0.3426, "step": 500 }, { "epoch": 7.0, "eval_Claim": { - "f1-score": 0.6040515653775324, - "precision": 0.6054453161052146, - "recall": 0.6026642168121268, - "support": 4354.0 + "f1-score": 0.6206536493682782, + "precision": 0.5920318725099601, + "recall": 0.652183454026772, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8052777186635455, - "precision": 0.8051063829787234, - "recall": 0.8054491272882077, - "support": 2349.0 + "f1-score": 0.8364370652905541, + "precision": 0.8519195612431444, + "recall": 0.8215072719259586, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9184720354599332, - "precision": 0.9315082331548641, - "recall": 0.9057956777996071, - "support": 10180.0 + "f1-score": 0.9008658773634918, + "precision": 0.9000706214689266, + "recall": 0.9016625397948355, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8908606921029282, - "precision": 0.8810881965774463, - "recall": 0.9008524001794527, - "support": 13374.0 + "f1-score": 0.8854242963272995, + "precision": 0.8978566881233642, + "recall": 0.8733314985551122, + "support": 14534.0 }, - "eval_accuracy": 0.8521994910268698, - "eval_loss": 0.5764245986938477, + "eval_accuracy": 0.8436714587312758, + "eval_loss": 0.5738794207572937, "eval_macro avg": { - "f1-score": 0.8046655029009848, - "precision": 0.8057870322040621, - "recall": 0.8036903555198486, - "support": 30257.0 - }, - "eval_runtime": 4.8398, - "eval_samples_per_second": 16.736, - "eval_steps_per_second": 2.273, + "f1-score": 0.8108452220874058, + "precision": 0.8104696858363488, + "recall": 0.8121711910756696, + "support": 29841.0 + }, + "eval_runtime": 4.8167, + "eval_samples_per_second": 16.609, + "eval_steps_per_second": 2.076, "eval_weighted avg": { - "f1-score": 0.8522343290465387, - "precision": 0.8524880574571969, - "recall": 0.8521994910268698, - "support": 30257.0 + "f1-score": 0.8456551258354699, + "precision": 0.8482906998207675, + "recall": 0.8436714587312758, + "support": 29841.0 }, "step": 567 }, { "epoch": 8.0, "eval_Claim": { - "f1-score": 0.597346719254213, - "precision": 0.6227261400448543, - "recall": 0.5739549839228296, - "support": 4354.0 + "f1-score": 0.6410105757931845, + "precision": 0.5787798408488064, + "recall": 0.7182356813693219, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8047001620745543, - "precision": 0.7676845767298028, - "recall": 0.8454661558109834, - "support": 2349.0 + "f1-score": 0.8115942028985507, + "precision": 0.8804123711340206, + "recall": 0.75275451740855, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9099175618286286, - "precision": 0.9258769700050838, - "recall": 0.8944990176817289, - "support": 10180.0 + "f1-score": 0.8960937967338637, + "precision": 0.9094220495386109, + "recall": 0.8831505718665251, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8942491542873952, - "precision": 0.8797569092750688, - "recall": 0.9092268580828473, - "support": 13374.0 + "f1-score": 0.891816143497758, + "precision": 0.9084939329050679, + "recall": 0.8757396449704142, + "support": 14534.0 }, - "eval_accuracy": 0.8510757841160723, - "eval_loss": 0.5954988598823547, + "eval_accuracy": 0.8444422103816897, + "eval_loss": 0.5891872644424438, "eval_macro avg": { - "f1-score": 0.8015533993611977, - "precision": 0.7990111490137024, - "recall": 0.8057867538745973, - "support": 30257.0 - }, - "eval_runtime": 4.8609, - "eval_samples_per_second": 16.663, - "eval_steps_per_second": 2.263, + "f1-score": 0.8101286797308392, + "precision": 0.8192770486066265, + "recall": 0.8074701039037029, + "support": 29841.0 + }, + "eval_runtime": 4.799, + "eval_samples_per_second": 16.67, + "eval_steps_per_second": 2.084, "eval_weighted avg": { - "f1-score": 0.8498442431569896, - "precision": 0.8495864475589161, - "recall": 0.8510757841160723, - "support": 30257.0 + "f1-score": 0.8486317402219317, + "precision": 0.8562720628608399, + "recall": 0.8444422103816897, + "support": 29841.0 }, "step": 648 }, { "epoch": 9.0, "eval_Claim": { - "f1-score": 0.6049033474776048, - "precision": 0.6213075060532688, - "recall": 0.5893431327514929, - "support": 4354.0 + "f1-score": 0.6284997910572503, + "precision": 0.5998005982053839, + "recall": 0.6600833881939873, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.823503227242377, - "precision": 0.8628731343283582, - "recall": 0.787569178373776, - "support": 2349.0 + "f1-score": 0.816712834718375, + "precision": 0.857489093553078, + "recall": 0.7796386073159982, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9189658498938837, - "precision": 0.9027672479150872, - "recall": 0.9357563850687622, - "support": 10180.0 + "f1-score": 0.8971996170416466, + "precision": 0.9108249301421455, + "recall": 0.8839759462327555, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8989367655288193, - "precision": 0.8970292606656243, - "recall": 0.9008524001794527, - "support": 13374.0 + "f1-score": 0.8942406935938898, + "precision": 0.8943022295623452, + "recall": 0.8941791660932985, + "support": 14534.0 }, - "eval_accuracy": 0.8589747826949136, - "eval_loss": 0.5689579844474792, + "eval_accuracy": 0.8468214872155759, + "eval_loss": 0.7009620070457458, "eval_macro avg": { - "f1-score": 0.8115772975356712, - "precision": 0.8209942872405847, - "recall": 0.803380274093371, - "support": 30257.0 - }, - "eval_runtime": 4.8593, - "eval_samples_per_second": 16.669, - "eval_steps_per_second": 2.264, + "f1-score": 0.8091632341027905, + "precision": 0.8156042128657381, + "recall": 0.8044692769590099, + "support": 29841.0 + }, + "eval_runtime": 4.8005, + "eval_samples_per_second": 16.665, + "eval_steps_per_second": 2.083, "eval_weighted avg": { - "f1-score": 0.8575077142417292, - "precision": 0.8566315824374819, - "recall": 0.8589747826949136, - "support": 30257.0 + "f1-score": 0.848605581671113, + "precision": 0.8512257939173797, + "recall": 0.8468214872155759, + "support": 29841.0 }, "step": 729 }, { "epoch": 10.0, "eval_Claim": { - "f1-score": 0.60162224797219, - "precision": 0.6071094480823199, - "recall": 0.5962333486449242, - "support": 4354.0 + "f1-score": 0.6189745836985101, + "precision": 0.6180266900021877, + "recall": 0.619925389510643, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8131676477000218, - "precision": 0.8333333333333334, - "recall": 0.7939548744146445, - "support": 2349.0 + "f1-score": 0.8208921766420085, + "precision": 0.8353102189781022, + "recall": 0.8069634200088145, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9197247706422018, - "precision": 0.9338801134062373, - "recall": 0.905992141453831, - "support": 10180.0 + "f1-score": 0.8951902368987796, + "precision": 0.9085610200364299, + "recall": 0.8822072868765476, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9008479864909512, - "precision": 0.884834499170693, - "recall": 0.9174517720951099, - "support": 13374.0 + "f1-score": 0.8963474827245805, + "precision": 0.8870174493027017, + "recall": 0.905875877253337, + "support": 14534.0 }, - "eval_accuracy": 0.8577849753775986, - "eval_loss": 0.7088457942008972, + "eval_accuracy": 0.8479608592205355, + "eval_loss": 0.7416248917579651, "eval_macro avg": { - "f1-score": 0.8088406632013413, - "precision": 0.8147893484981459, - "recall": 0.8034080341521274, - "support": 30257.0 - }, - "eval_runtime": 4.9043, - "eval_samples_per_second": 16.516, - "eval_steps_per_second": 2.243, + "f1-score": 0.8078511199909697, + "precision": 0.8122288445798553, + "recall": 0.8037429934123356, + "support": 29841.0 + }, + "eval_runtime": 4.7804, + "eval_samples_per_second": 16.735, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8573332851434664, - "precision": 0.8573728619273148, - "recall": 0.8577849753775986, - "support": 30257.0 + "f1-score": 0.8479238041544329, + "precision": 0.8481312332795722, + "recall": 0.8479608592205355, + "support": 29841.0 }, "step": 810 }, { "epoch": 11.0, "eval_Claim": { - "f1-score": 0.6253176253176252, - "precision": 0.6289498141263941, - "recall": 0.6217271474506201, - "support": 4354.0 + "f1-score": 0.6350413962855225, + "precision": 0.6477973065510158, + "recall": 0.6227781435154707, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7947071414672116, - "precision": 0.7318996415770609, - "recall": 0.8693060876968923, - "support": 2349.0 + "f1-score": 0.8403837767117314, + "precision": 0.8316788951230039, + "recall": 0.8492728074041428, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9110249527786062, - "precision": 0.9221171261823304, - "recall": 0.900196463654224, - "support": 10180.0 + "f1-score": 0.9076665470637484, + "precision": 0.920883387938357, + "recall": 0.894823723617498, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8996578818752584, - "precision": 0.9047258979206049, - "recall": 0.8946463286974727, - "support": 13374.0 + "f1-score": 0.9016170675363501, + "precision": 0.8904844987250033, + "recall": 0.9130315123159488, + "support": 14534.0 }, - "eval_accuracy": 0.8552731599299336, - "eval_loss": 0.7312190532684326, + "eval_accuracy": 0.8586843604436849, + "eval_loss": 0.753268837928772, "eval_macro avg": { - "f1-score": 0.8076769003596753, - "precision": 0.7969231199515976, - "recall": 0.8214690068748023, - "support": 30257.0 - }, - "eval_runtime": 4.9029, - "eval_samples_per_second": 16.521, - "eval_steps_per_second": 2.244, + "f1-score": 0.8211771968993381, + "precision": 0.822711022084345, + "recall": 0.8199765467132651, + "support": 29841.0 + }, + "eval_runtime": 4.7829, + "eval_samples_per_second": 16.726, + "eval_steps_per_second": 2.091, "eval_weighted avg": { - "f1-score": 0.8558567785115953, - "precision": 0.857475501606145, - "recall": 0.8552731599299336, - "support": 30257.0 + "f1-score": 0.8579718131916827, + "precision": 0.8575920866110881, + "recall": 0.8586843604436849, + "support": 29841.0 }, "step": 891 }, { "epoch": 12.0, "eval_Claim": { - "f1-score": 0.633677135241627, - "precision": 0.6395321637426901, - "recall": 0.6279283417547084, - "support": 4354.0 + "f1-score": 0.6230640668523677, + "precision": 0.6328655500226347, + "recall": 0.6135615536537196, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8290997764681975, - "precision": 0.7931570762052877, - "recall": 0.8684546615581098, - "support": 2349.0 + "f1-score": 0.837270341207349, + "precision": 0.8310898827616153, + "recall": 0.8435434111943587, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.916678984971668, - "precision": 0.9196243203163619, - "recall": 0.9137524557956778, - "support": 10180.0 + "f1-score": 0.8982022214588343, + "precision": 0.8730105731775181, + "recall": 0.9248909326730338, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9029209944129889, - "precision": 0.905603610379842, - "recall": 0.9002542246149244, - "support": 13374.0 + "f1-score": 0.8888346297394397, + "precision": 0.9013795542978422, + "recall": 0.8766340993532407, + "support": 14534.0 }, - "eval_accuracy": 0.8631391083055161, - "eval_loss": 0.7092207074165344, + "eval_accuracy": 0.8476592607486344, + "eval_loss": 0.8125314712524414, "eval_macro avg": { - "f1-score": 0.8205942227736204, - "precision": 0.8144792926610454, - "recall": 0.8275974209308551, - "support": 30257.0 - }, - "eval_runtime": 4.8734, - "eval_samples_per_second": 16.621, - "eval_steps_per_second": 2.257, + "f1-score": 0.8118428148144977, + "precision": 0.8095863900649026, + "recall": 0.8146574992185882, + "support": 29841.0 + }, + "eval_runtime": 4.7824, + "eval_samples_per_second": 16.728, + "eval_steps_per_second": 2.091, "eval_weighted avg": { - "f1-score": 0.8630744313070275, - "precision": 0.8633032778855295, - "recall": 0.8631391083055161, - "support": 30257.0 + "f1-score": 0.846990546753497, + "precision": 0.8469677413197487, + "recall": 0.8476592607486344, + "support": 29841.0 }, "step": 972 }, { "epoch": 12.35, - "grad_norm": 4.426708698272705, + "grad_norm": 15.335172653198242, "learning_rate": 1.506172839506173e-05, - "loss": 0.063, + "loss": 0.061, "step": 1000 }, { "epoch": 13.0, "eval_Claim": { - "f1-score": 0.5936837143530521, - "precision": 0.6096321393998064, - "recall": 0.5785484611851172, - "support": 4354.0 + "f1-score": 0.6158673240699238, + "precision": 0.6292649416075109, + "recall": 0.6030283080974326, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8065005417118094, - "precision": 0.821270962047661, - "recall": 0.7922520221370796, - "support": 2349.0 + "f1-score": 0.8147180492053124, + "precision": 0.8050774526678142, + "recall": 0.8245923314235346, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9133826964170352, - "precision": 0.9242683294780247, - "recall": 0.9027504911591355, - "support": 10180.0 + "f1-score": 0.9060346875742457, + "precision": 0.9128665469778575, + "recall": 0.8993043273198915, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.901282521069989, - "precision": 0.883730957171601, - "recall": 0.9195453865709585, - "support": 13374.0 + "f1-score": 0.9008830850011933, + "precision": 0.8929368029739777, + "recall": 0.9089720655015825, + "support": 14534.0 }, - "eval_accuracy": 0.854942657897346, - "eval_loss": 0.7807008624076843, + "eval_accuracy": 0.8530880332428538, + "eval_loss": 0.8537381887435913, "eval_macro avg": { - "f1-score": 0.8037123683879714, - "precision": 0.8097255970242733, - "recall": 0.7982740902630727, - "support": 30257.0 - }, - "eval_runtime": 4.8517, - "eval_samples_per_second": 16.695, - "eval_steps_per_second": 2.267, + "f1-score": 0.8093757864626687, + "precision": 0.8100364360567901, + "recall": 0.8089742580856103, + "support": 29841.0 + }, + "eval_runtime": 4.7933, + "eval_samples_per_second": 16.69, + "eval_steps_per_second": 2.086, "eval_weighted avg": { - "f1-score": 0.8537315976828396, - "precision": 0.8530777420132861, - "recall": 0.854942657897346, - "support": 30257.0 + "f1-score": 0.8522709558043637, + "precision": 0.8516552983596964, + "recall": 0.8530880332428538, + "support": 29841.0 }, "step": 1053 }, { "epoch": 14.0, "eval_Claim": { - "f1-score": 0.6335702820454024, - "precision": 0.632554945054945, - "recall": 0.6345888837850253, - "support": 4354.0 + "f1-score": 0.6346033728919426, + "precision": 0.6036838978015449, + "recall": 0.6688610928242265, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8183556405353729, - "precision": 0.816793893129771, - "recall": 0.8199233716475096, - "support": 2349.0 + "f1-score": 0.8067737733391228, + "precision": 0.7950363714163458, + "recall": 0.8188629352137505, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9172396976347231, - "precision": 0.9107990314769976, - "recall": 0.9237721021611002, - "support": 10180.0 + "f1-score": 0.9004597838418822, + "precision": 0.9121703363174449, + "recall": 0.8890461030538852, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8981941309255079, - "precision": 0.9039073148568832, - "recall": 0.8925527142216241, - "support": 13374.0 + "f1-score": 0.8921770010096438, + "precision": 0.903023468884347, + "recall": 0.8815880005504335, + "support": 14534.0 }, - "eval_accuracy": 0.8602967908252636, - "eval_loss": 0.7879041433334351, + "eval_accuracy": 0.8464528668610302, + "eval_loss": 0.9449928998947144, "eval_macro avg": { - "f1-score": 0.8168399377852517, - "precision": 0.8160137961296492, - "recall": 0.8177092679538147, - "support": 30257.0 - }, - "eval_runtime": 4.864, - "eval_samples_per_second": 16.653, - "eval_steps_per_second": 2.262, + "f1-score": 0.8085034827706478, + "precision": 0.8034785186049206, + "recall": 0.8145895329105739, + "support": 29841.0 + }, + "eval_runtime": 4.8154, + "eval_samples_per_second": 16.613, + "eval_steps_per_second": 2.077, "eval_weighted avg": { - "f1-score": 0.8603242501425289, - "precision": 0.8604152313535001, - "recall": 0.8602967908252636, - "support": 30257.0 + "f1-score": 0.8487033685671466, + "precision": 0.8517001698367573, + "recall": 0.8464528668610302, + "support": 29841.0 }, "step": 1134 }, { "epoch": 15.0, "eval_Claim": { - "f1-score": 0.6212592513139547, - "precision": 0.5828134433487623, - "recall": 0.6651355075792375, - "support": 4354.0 + "f1-score": 0.6062717770034843, + "precision": 0.5687367813881946, + "recall": 0.6491112574061882, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7988422575976845, - "precision": 0.7765273311897106, - "recall": 0.822477650063857, - "support": 2349.0 + "f1-score": 0.8176843948347561, + "precision": 0.8121739130434783, + "recall": 0.8232701630674306, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9143625765954267, - "precision": 0.9276255938542404, - "recall": 0.9014734774066797, - "support": 10180.0 + "f1-score": 0.8942823803967327, + "precision": 0.8850906571197598, + "recall": 0.9036670203985379, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8928883984627678, - "precision": 0.9090416053304409, - "recall": 0.8772992373261552, - "support": 13374.0 + "f1-score": 0.877618288144604, + "precision": 0.9049777063080184, + "recall": 0.8518645933672767, + "support": 14534.0 }, - "eval_accuracy": 0.8506461314737086, - "eval_loss": 0.8185116052627563, + "eval_accuracy": 0.8334506216279616, + "eval_loss": 1.0531803369522095, "eval_macro avg": { - "f1-score": 0.8068381209924584, - "precision": 0.7990019934307886, - "recall": 0.8165964680939823, - "support": 30257.0 - }, - "eval_runtime": 4.8575, - "eval_samples_per_second": 16.675, - "eval_steps_per_second": 2.265, + "f1-score": 0.7989642100948944, + "precision": 0.7927447644648628, + "recall": 0.8069782585598584, + "support": 29841.0 + }, + "eval_runtime": 4.774, + "eval_samples_per_second": 16.757, + "eval_steps_per_second": 2.095, "eval_weighted avg": { - "f1-score": 0.8537245501570023, - "precision": 0.8580620487302317, - "recall": 0.8506461314737086, - "support": 30257.0 + "f1-score": 0.8363600230462553, + "precision": 0.8409220859889104, + "recall": 0.8334506216279616, + "support": 29841.0 }, "step": 1215 }, { "epoch": 16.0, "eval_Claim": { - "f1-score": 0.620457750298297, - "precision": 0.5878725590955807, - "recall": 0.6568672485071199, - "support": 4354.0 + "f1-score": 0.6349479110729246, + "precision": 0.6217921750105174, + "recall": 0.6486723721746763, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8217720482913852, - "precision": 0.7911741528762806, - "recall": 0.8548318433375904, - "support": 2349.0 + "f1-score": 0.8260292164674634, + "precision": 0.8297020898176968, + "recall": 0.8223887174966946, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9171081176529942, - "precision": 0.9427445285758739, - "recall": 0.8928290766208251, - "support": 10180.0 + "f1-score": 0.9045516104339634, + "precision": 0.9034344860032933, + "recall": 0.9056715010022403, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8952495580546884, - "precision": 0.900703852266707, - "recall": 0.8898609241812472, - "support": 13374.0 + "f1-score": 0.8956702459300312, + "precision": 0.90185546875, + "recall": 0.8895692858125774, + "support": 14534.0 }, - "eval_accuracy": 0.8546121558647586, - "eval_loss": 0.8933361768722534, + "eval_accuracy": 0.8522502597097953, + "eval_loss": 0.9694080352783203, "eval_macro avg": { - "f1-score": 0.8136468685743412, - "precision": 0.8056237732036106, - "recall": 0.8235972731616956, - "support": 30257.0 - }, - "eval_runtime": 4.839, - "eval_samples_per_second": 16.739, - "eval_steps_per_second": 2.273, + "f1-score": 0.8152997459760956, + "precision": 0.8141960548953769, + "recall": 0.8165754691215471, + "support": 29841.0 + }, + "eval_runtime": 4.7829, + "eval_samples_per_second": 16.726, + "eval_steps_per_second": 2.091, "eval_weighted avg": { - "f1-score": 0.8573567707758909, - "precision": 0.8613285464033407, - "recall": 0.8546121558647586, - "support": 30257.0 + "f1-score": 0.8530843968151707, + "precision": 0.854049671322198, + "recall": 0.8522502597097953, + "support": 29841.0 }, "step": 1296 }, { "epoch": 17.0, "eval_Claim": { - "f1-score": 0.577664702731655, - "precision": 0.6926782273603083, - "recall": 0.49540652273771246, - "support": 4354.0 + "f1-score": 0.6241452751933639, + "precision": 0.6379468377635197, + "recall": 0.6109282422646478, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8222534645511148, - "precision": 0.7783269961977186, - "recall": 0.8714346530438485, - "support": 2349.0 + "f1-score": 0.8151592652871426, + "precision": 0.8626968503937008, + "recall": 0.7725870427501101, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9173265135494024, - "precision": 0.9185462424899045, - "recall": 0.9161100196463654, - "support": 10180.0 + "f1-score": 0.9064921025764218, + "precision": 0.9237454100367197, + "recall": 0.8898714774201155, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.901492752578063, - "precision": 0.8705431754874652, - "recall": 0.9347240915208613, - "support": 13374.0 + "f1-score": 0.8993928008319636, + "precision": 0.8775777414075286, + "recall": 0.9223200770606853, + "support": 14534.0 }, - "eval_accuracy": 0.8603298410285223, - "eval_loss": 0.8753499984741211, + "eval_accuracy": 0.8541603833651688, + "eval_loss": 0.985948920249939, "eval_macro avg": { - "f1-score": 0.8046843583525589, - "precision": 0.8150236603838491, - "recall": 0.8044188217371968, - "support": 30257.0 - }, - "eval_runtime": 4.8417, - "eval_samples_per_second": 16.73, - "eval_steps_per_second": 2.272, + "f1-score": 0.8112973609722229, + "precision": 0.8254917099003672, + "recall": 0.7989267098738898, + "support": 29841.0 + }, + "eval_runtime": 4.7769, + "eval_samples_per_second": 16.747, + "eval_steps_per_second": 2.093, "eval_weighted avg": { - "f1-score": 0.8540692561997597, - "precision": 0.8539397922302876, - "recall": 0.8603298410285223, - "support": 30257.0 + "f1-score": 0.8529727851357218, + "precision": 0.85297351326598, + "recall": 0.8541603833651688, + "support": 29841.0 }, "step": 1377 }, { "epoch": 18.0, "eval_Claim": { - "f1-score": 0.6204532891100056, - "precision": 0.5981667021956939, - "recall": 0.6444648598989435, - "support": 4354.0 + "f1-score": 0.638718890248878, + "precision": 0.5967219363445778, + "recall": 0.6870748299319728, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8362068965517241, - "precision": 0.807372175980975, - "recall": 0.8671775223499362, - "support": 2349.0 + "f1-score": 0.778357854769815, + "precision": 0.8431876606683805, + "recall": 0.7227853680035258, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9045747829039926, - "precision": 0.8936068244991853, - "recall": 0.9158153241650294, - "support": 10180.0 + "f1-score": 0.9013165698019214, + "precision": 0.9066937119675457, + "recall": 0.8960028298549699, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8850831280788178, - "precision": 0.9118953211736717, - "recall": 0.8598026020637057, - "support": 13374.0 + "f1-score": 0.8934796194708702, + "precision": 0.9018082422203533, + "recall": 0.885303426448328, + "support": 14534.0 }, - "eval_accuracy": 0.8482334666358198, - "eval_loss": 0.9685499668121338, + "eval_accuracy": 0.8457156261519386, + "eval_loss": 0.9986578822135925, "eval_macro avg": { - "f1-score": 0.811579524161135, - "precision": 0.8027602559623814, - "recall": 0.8218150771194037, - "support": 30257.0 - }, - "eval_runtime": 4.8521, - "eval_samples_per_second": 16.694, - "eval_steps_per_second": 2.267, + "f1-score": 0.8029682335728712, + "precision": 0.8121028878002143, + "recall": 0.7977916135596992, + "support": 29841.0 + }, + "eval_runtime": 4.7848, + "eval_samples_per_second": 16.719, + "eval_steps_per_second": 2.09, "eval_weighted avg": { - "f1-score": 0.8497662248627994, - "precision": 0.8524817583209754, - "recall": 0.8482334666358198, - "support": 30257.0 + "f1-score": 0.8480491462490054, + "precision": 0.8521498954326654, + "recall": 0.8457156261519386, + "support": 29841.0 }, "step": 1458 }, { "epoch": 18.52, - "grad_norm": 0.44517388939857483, + "grad_norm": 11.437110900878906, "learning_rate": 1.2592592592592593e-05, - "loss": 0.0216, + "loss": 0.0189, "step": 1500 }, { "epoch": 19.0, "eval_Claim": { - "f1-score": 0.6178126034654013, - "precision": 0.5946462715105163, - "recall": 0.6428571428571429, - "support": 4354.0 + "f1-score": 0.6127094530509011, + "precision": 0.5894160583941606, + "recall": 0.6379196840026333, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8151062155782848, - "precision": 0.7575868372943327, - "recall": 0.8820774797786292, - "support": 2349.0 + "f1-score": 0.800753453327752, + "precision": 0.762455161418892, + "recall": 0.8431026884089907, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9146588828971454, - "precision": 0.9213595136051032, - "recall": 0.9080550098231827, - "support": 10180.0 + "f1-score": 0.8959336706699994, + "precision": 0.9275435496086847, + "recall": 0.8664072632944229, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8898914207065302, - "precision": 0.9104991394148021, - "recall": 0.870195902497383, - "support": 13374.0 + "f1-score": 0.8912863642630635, + "precision": 0.8930100842657825, + "recall": 0.8895692858125774, + "support": 14534.0 }, - "eval_accuracy": 0.8511418845225898, - "eval_loss": 0.9391252398490906, + "eval_accuracy": 0.8410240943668108, + "eval_loss": 1.0641764402389526, "eval_macro avg": { - "f1-score": 0.8093672806618404, - "precision": 0.7960229404561886, - "recall": 0.8257963837390844, - "support": 30257.0 - }, - "eval_runtime": 4.8661, - "eval_samples_per_second": 16.646, - "eval_steps_per_second": 2.261, + "f1-score": 0.800170735327929, + "precision": 0.79310621342188, + "recall": 0.8092497303796561, + "support": 29841.0 + }, + "eval_runtime": 4.8048, + "eval_samples_per_second": 16.65, + "eval_steps_per_second": 2.081, "eval_weighted avg": { - "f1-score": 0.853266214902463, - "precision": 0.8568303759789367, - "recall": 0.8511418845225898, - "support": 30257.0 + "f1-score": 0.8431820663618932, + "precision": 0.8465361465202841, + "recall": 0.8410240943668108, + "support": 29841.0 }, "step": 1539 }, { "epoch": 20.0, "eval_Claim": { - "f1-score": 0.6097087378640776, - "precision": 0.6064530788457169, - "recall": 0.6129995406522738, - "support": 4354.0 + "f1-score": 0.6346276257161044, + "precision": 0.6142945163277881, + "recall": 0.6563528637261357, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8268961376826096, - "precision": 0.7802114803625377, - "recall": 0.8795232013622818, - "support": 2349.0 + "f1-score": 0.8171902268760908, + "precision": 0.8090712742980561, + "recall": 0.8254737769942706, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9215637325877477, - "precision": 0.9370494466443293, - "recall": 0.906581532416503, - "support": 10180.0 + "f1-score": 0.9044396961063628, + "precision": 0.9106011712680769, + "recall": 0.8983610423299139, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.896644596566042, - "precision": 0.8971479901190209, - "recall": 0.8961417676087932, - "support": 13374.0 + "f1-score": 0.894879267277269, + "precision": 0.902519244226732, + "recall": 0.8873675519471584, + "support": 14534.0 }, - "eval_accuracy": 0.8576197243613048, - "eval_loss": 0.8915661573410034, + "eval_accuracy": 0.8505076907610335, + "eval_loss": 1.087249994277954, "eval_macro avg": { - "f1-score": 0.8137033011751192, - "precision": 0.8052154989929012, - "recall": 0.8238115105099629, - "support": 30257.0 - }, - "eval_runtime": 4.864, - "eval_samples_per_second": 16.653, - "eval_steps_per_second": 2.261, + "f1-score": 0.8127842039939568, + "precision": 0.8091215515301633, + "recall": 0.8168888087493696, + "support": 29841.0 + }, + "eval_runtime": 4.7799, + "eval_samples_per_second": 16.737, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8583235120565212, - "precision": 0.8596633525913644, - "recall": 0.8576197243613048, - "support": 30257.0 + "f1-score": 0.85194635060675, + "precision": 0.8536961248417916, + "recall": 0.8505076907610335, + "support": 29841.0 }, "step": 1620 }, { "epoch": 21.0, "eval_Claim": { - "f1-score": 0.6211416490486258, - "precision": 0.5754014884449667, - "recall": 0.6747818098300413, - "support": 4354.0 + "f1-score": 0.6397356640375187, + "precision": 0.6219689119170985, + "recall": 0.6585472898836954, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8162756902636495, - "precision": 0.7965964343598055, - "recall": 0.8369518944231588, - "support": 2349.0 + "f1-score": 0.8133363574506692, + "precision": 0.8378504672897197, + "recall": 0.7902159541648304, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.911611088790679, - "precision": 0.9325935059597205, - "recall": 0.8915520628683693, - "support": 10180.0 + "f1-score": 0.9003324267150197, + "precision": 0.9236111111111112, + "recall": 0.8781983256691428, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8885090218423553, - "precision": 0.9030190718863408, - "recall": 0.8744579033946464, - "support": 13374.0 + "f1-score": 0.8964765215020788, + "precision": 0.8880637321091007, + "recall": 0.9050502270538049, + "support": 14534.0 }, - "eval_accuracy": 0.8485639686684073, - "eval_loss": 0.9740728735923767, + "eval_accuracy": 0.8510438658221909, + "eval_loss": 1.093902826309204, "eval_macro avg": { - "f1-score": 0.8093843624863275, - "precision": 0.8019026251627084, - "recall": 0.8194359176290539, - "support": 30257.0 - }, - "eval_runtime": 4.884, - "eval_samples_per_second": 16.585, - "eval_steps_per_second": 2.252, + "f1-score": 0.8124702424263215, + "precision": 0.8178735556067575, + "recall": 0.8080029491928683, + "support": 29841.0 + }, + "eval_runtime": 4.813, + "eval_samples_per_second": 16.622, + "eval_steps_per_second": 2.078, "eval_weighted avg": { - "f1-score": 0.852199586158436, - "precision": 0.8575629461968616, - "recall": 0.8485639686684073, - "support": 30257.0 + "f1-score": 0.8520439894961911, + "precision": 0.8537133191814482, + "recall": 0.8510438658221909, + "support": 29841.0 }, "step": 1701 }, { "epoch": 22.0, "eval_Claim": { - "f1-score": 0.6145704312577412, - "precision": 0.6028274795670422, - "recall": 0.6267799724391364, - "support": 4354.0 + "f1-score": 0.6279694722132645, + "precision": 0.6154656552886641, + "recall": 0.640991880623217, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8148905706688483, - "precision": 0.784251968503937, - "recall": 0.8480204342273308, - "support": 2349.0 + "f1-score": 0.8173439463762043, + "precision": 0.7788423153692615, + "recall": 0.8598501542529748, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9175837613108339, - "precision": 0.9137847053093034, - "recall": 0.9214145383104125, - "support": 10180.0 + "f1-score": 0.9038883941822499, + "precision": 0.910210425633668, + "recall": 0.8976535785874308, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8915167877105593, - "precision": 0.9070019342359767, - "recall": 0.876551517870495, - "support": 13374.0 + "f1-score": 0.8954102920723226, + "precision": 0.9051033319274567, + "recall": 0.8859226640979772, + "support": 14534.0 }, - "eval_accuracy": 0.853488448953961, - "eval_loss": 0.9675940871238708, + "eval_accuracy": 0.849870982875909, + "eval_loss": 1.0930607318878174, "eval_macro avg": { - "f1-score": 0.8096403877369956, - "precision": 0.8019665219040648, - "recall": 0.8181916157118437, - "support": 30257.0 - }, - "eval_runtime": 4.8521, - "eval_samples_per_second": 16.694, - "eval_steps_per_second": 2.267, + "f1-score": 0.8111530262110103, + "precision": 0.8024054320547626, + "recall": 0.8211045693904, + "support": 29841.0 + }, + "eval_runtime": 4.8038, + "eval_samples_per_second": 16.654, + "eval_steps_per_second": 2.082, "eval_weighted avg": { - "f1-score": 0.8544854353433136, - "precision": 0.8559834381654265, - "recall": 0.853488448953961, - "support": 30257.0 + "f1-score": 0.8510432276144315, + "precision": 0.8527239921837771, + "recall": 0.849870982875909, + "support": 29841.0 }, "step": 1782 }, { "epoch": 23.0, "eval_Claim": { - "f1-score": 0.5983347015362965, - "precision": 0.6113108075724898, - "recall": 0.5858980248047773, - "support": 4354.0 + "f1-score": 0.6225736879942487, + "precision": 0.5851351351351352, + "recall": 0.6651305683563749, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8269188475918188, - "precision": 0.8553230209281165, - "recall": 0.800340570455513, - "support": 2349.0 + "f1-score": 0.8058810995099083, + "precision": 0.7801155115511551, + "recall": 0.8334067871308947, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9219349129879069, - "precision": 0.9227514268844715, - "recall": 0.9211198428290767, - "support": 10180.0 + "f1-score": 0.8976647945610404, + "precision": 0.9001659947830211, + "recall": 0.8951774554887395, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8949737988043397, - "precision": 0.8835616438356164, - "recall": 0.9066846119336025, - "support": 13374.0 + "f1-score": 0.8881674136288245, + "precision": 0.9116858653915816, + "recall": 0.8658318425760286, + "support": 14534.0 }, - "eval_accuracy": 0.8571239713124236, - "eval_loss": 0.9897539019584656, + "eval_accuracy": 0.8410576053081331, + "eval_loss": 1.1820006370544434, "eval_macro avg": { - "f1-score": 0.8105405652300904, - "precision": 0.8182367248051736, - "recall": 0.8035107625057423, - "support": 30257.0 - }, - "eval_runtime": 4.8416, - "eval_samples_per_second": 16.73, - "eval_steps_per_second": 2.272, + "f1-score": 0.8035717489235055, + "precision": 0.7942756267152233, + "recall": 0.8148866633880094, + "support": 29841.0 + }, + "eval_runtime": 4.7901, + "eval_samples_per_second": 16.701, + "eval_steps_per_second": 2.088, "eval_weighted avg": { - "f1-score": 0.8560749136698399, - "precision": 0.8553777302003576, - "recall": 0.8571239713124236, - "support": 30257.0 + "f1-score": 0.8440512323089471, + "precision": 0.8485403664715132, + "recall": 0.8410576053081331, + "support": 29841.0 }, "step": 1863 }, { "epoch": 24.0, "eval_Claim": { - "f1-score": 0.6090506975161619, - "precision": 0.6016132646202106, - "recall": 0.6166743224621039, - "support": 4354.0 + "f1-score": 0.6244661044792466, + "precision": 0.6233056405771753, + "recall": 0.6256308975202984, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7960317460317461, - "precision": 0.7454477889260498, - "recall": 0.853980417198808, - "support": 2349.0 + "f1-score": 0.8177083333333335, + "precision": 0.8054724241128688, + "recall": 0.8303217276333187, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9115434760806339, - "precision": 0.9310592091784471, - "recall": 0.8928290766208251, - "support": 10180.0 + "f1-score": 0.9007499414108273, + "precision": 0.8951904040992198, + "recall": 0.9063789647447235, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8995695302264645, - "precision": 0.9006821077880219, - "recall": 0.89845969792134, - "support": 13374.0 + "f1-score": 0.8948225108225109, + "precision": 0.9008437347465309, + "recall": 0.888881243979634, + "support": 14534.0 }, - "eval_accuracy": 0.852563043262716, - "eval_loss": 0.9720127582550049, + "eval_accuracy": 0.8492007640494621, + "eval_loss": 1.1699731349945068, "eval_macro avg": { - "f1-score": 0.8040488624637516, - "precision": 0.7947005926281823, - "recall": 0.8154858785507693, - "support": 30257.0 - }, - "eval_runtime": 4.8503, - "eval_samples_per_second": 16.7, - "eval_steps_per_second": 2.268, + "f1-score": 0.8094367225114796, + "precision": 0.8062030508839487, + "recall": 0.8128032084694936, + "support": 29841.0 + }, + "eval_runtime": 4.802, + "eval_samples_per_second": 16.66, + "eval_steps_per_second": 2.082, "eval_weighted avg": { - "f1-score": 0.8537541987693271, - "precision": 0.8558147294621835, - "recall": 0.852563043262716, - "support": 30257.0 + "f1-score": 0.8493576914930753, + "precision": 0.8496026739182283, + "recall": 0.8492007640494621, + "support": 29841.0 }, "step": 1944 }, { "epoch": 24.69, - "grad_norm": 3.446370840072632, + "grad_norm": 9.07358169555664, "learning_rate": 1.0123456790123458e-05, - "loss": 0.0116, + "loss": 0.006, "step": 2000 }, { "epoch": 25.0, "eval_Claim": { - "f1-score": 0.6102259215219976, - "precision": 0.6326429980276134, - "recall": 0.5893431327514929, - "support": 4354.0 + "f1-score": 0.622420524261015, + "precision": 0.632940108892922, + "recall": 0.6122448979591837, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8064243448858834, - "precision": 0.8006714225765842, - "recall": 0.8122605363984674, - "support": 2349.0 + "f1-score": 0.8149307107733571, + "precision": 0.8267573696145125, + "recall": 0.8034376377258704, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9169322709163347, - "precision": 0.9298989898989899, - "recall": 0.9043222003929273, - "support": 10180.0 + "f1-score": 0.9018776855612456, + "precision": 0.9004466384579219, + "recall": 0.9033132885272963, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8993844349992672, - "precision": 0.8818077309958328, - "recall": 0.917676087931808, - "support": 13374.0 + "f1-score": 0.8975866548164354, + "precision": 0.8919157608695653, + "recall": 0.9033301224714463, + "support": 14534.0 }, - "eval_accuracy": 0.8577519251743398, - "eval_loss": 1.0132465362548828, + "eval_accuracy": 0.8512784424114473, + "eval_loss": 1.1391637325286865, "eval_macro avg": { - "f1-score": 0.8082417430808707, - "precision": 0.811255285374755, - "recall": 0.8059004893686739, - "support": 30257.0 - }, - "eval_runtime": 4.8662, - "eval_samples_per_second": 16.645, - "eval_steps_per_second": 2.26, + "f1-score": 0.8092038938530133, + "precision": 0.8130149694587304, + "recall": 0.8055814866709491, + "support": 29841.0 + }, + "eval_runtime": 4.83, + "eval_samples_per_second": 16.563, + "eval_steps_per_second": 2.07, "eval_weighted avg": { - "f1-score": 0.8564613940592988, - "precision": 0.8558341242209939, - "recall": 0.8577519251743398, - "support": 30257.0 + "f1-score": 0.8505008948811765, + "precision": 0.8498378793311306, + "recall": 0.8512784424114473, + "support": 29841.0 }, "step": 2025 }, { "epoch": 26.0, "eval_Claim": { - "f1-score": 0.6123184326089406, - "precision": 0.6006185111552905, - "recall": 0.6244832338079926, - "support": 4354.0 + "f1-score": 0.6216186854970125, + "precision": 0.6155335628227194, + "recall": 0.6278253236778583, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.7939849624060151, - "precision": 0.8013876843018214, - "recall": 0.7867177522349936, - "support": 2349.0 + "f1-score": 0.8021786492374727, + "precision": 0.7931925894011203, + "recall": 0.8113706478624945, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9205986178093769, - "precision": 0.93204469948656, - "recall": 0.9094302554027505, - "support": 10180.0 + "f1-score": 0.9000058854687776, + "precision": 0.8984723854289072, + "recall": 0.9015446291710884, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8996091568955891, - "precision": 0.8957082499444073, - "recall": 0.9035441902198296, - "support": 13374.0 + "f1-score": 0.8959025470653377, + "precision": 0.9012672329759086, + "recall": 0.8906013485619926, + "support": 14534.0 }, - "eval_accuracy": 0.8562977162309549, - "eval_loss": 1.0289610624313354, + "eval_accuracy": 0.8475587279246674, + "eval_loss": 1.18631911277771, "eval_macro avg": { - "f1-score": 0.8066277924299805, - "precision": 0.8074397862220198, - "recall": 0.8060438579163915, - "support": 30257.0 - }, - "eval_runtime": 4.8488, - "eval_samples_per_second": 16.705, - "eval_steps_per_second": 2.269, + "f1-score": 0.80492644181715, + "precision": 0.8021164426571639, + "recall": 0.8078354873183584, + "support": 29841.0 + }, + "eval_runtime": 4.7928, + "eval_samples_per_second": 16.692, + "eval_steps_per_second": 2.086, "eval_weighted avg": { - "f1-score": 0.8571296534981037, - "precision": 0.8581475309358099, - "recall": 0.8562977162309549, - "support": 30257.0 + "f1-score": 0.8480566079768785, + "precision": 0.848621115111045, + "recall": 0.8475587279246674, + "support": 29841.0 }, "step": 2106 }, { "epoch": 27.0, "eval_Claim": { - "f1-score": 0.6028743397617001, - "precision": 0.6480063374702931, - "recall": 0.5636196600826826, - "support": 4354.0 + "f1-score": 0.6274287012839449, + "precision": 0.6505655042412818, + "recall": 0.6058810621022602, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8248976954555244, - "precision": 0.8347863993025283, - "recall": 0.8152405278842061, - "support": 2349.0 + "f1-score": 0.8276779773785763, + "precision": 0.8330357142857143, + "recall": 0.8223887174966946, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9177434297137843, - "precision": 0.9111240197502178, - "recall": 0.9244597249508841, - "support": 10180.0 + "f1-score": 0.9055736912102527, + "precision": 0.9291651159905719, + "recall": 0.8831505718665251, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8988648469931302, - "precision": 0.883512674225464, - "recall": 0.9147599820547331, - "support": 13374.0 + "f1-score": 0.8996312437143815, + "precision": 0.8772228033472803, + "recall": 0.9232145314435117, + "support": 14534.0 }, - "eval_accuracy": 0.8597679875731236, - "eval_loss": 1.0470740795135498, + "eval_accuracy": 0.8557018866659964, + "eval_loss": 1.173492431640625, "eval_macro avg": { - "f1-score": 0.8110950779810349, - "precision": 0.8193573576871258, - "recall": 0.8045199737431264, - "support": 30257.0 - }, - "eval_runtime": 4.8822, - "eval_samples_per_second": 16.591, - "eval_steps_per_second": 2.253, + "f1-score": 0.8150779033967888, + "precision": 0.8224972844662122, + "recall": 0.8086587207272479, + "support": 29841.0 + }, + "eval_runtime": 4.7958, + "eval_samples_per_second": 16.681, + "eval_steps_per_second": 2.085, "eval_weighted avg": { - "f1-score": 0.8568809247486504, - "precision": 0.8551301805022264, - "recall": 0.8597679875731236, - "support": 30257.0 + "f1-score": 0.8542811867471567, + "precision": 0.8540126205927153, + "recall": 0.8557018866659964, + "support": 29841.0 }, "step": 2187 }, { "epoch": 28.0, "eval_Claim": { - "f1-score": 0.6148011951275568, - "precision": 0.6152253909843606, - "recall": 0.6143775838309601, - "support": 4354.0 + "f1-score": 0.6397700895324416, + "precision": 0.644543429844098, + "recall": 0.6350669299978056, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.80912003014886, - "precision": 0.7258282623394186, - "recall": 0.9140059599829715, - "support": 2349.0 + "f1-score": 0.8197434224831485, + "precision": 0.8090128755364807, + "recall": 0.8307624504186867, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9129290270324997, - "precision": 0.9418216001671192, - "recall": 0.8857563850687623, - "support": 10180.0 + "f1-score": 0.9052350945225399, + "precision": 0.9310731646516266, + "recall": 0.8807923593915812, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.897985122051512, - "precision": 0.8978844284966734, - "recall": 0.8980858381935098, - "support": 13374.0 + "f1-score": 0.9018691588785046, + "precision": 0.8879183891185491, + "recall": 0.916265308930783, + "support": 14534.0 }, - "eval_accuracy": 0.8543477542386886, - "eval_loss": 1.0588206052780151, + "eval_accuracy": 0.856740725846989, + "eval_loss": 1.153747797012329, "eval_macro avg": { - "f1-score": 0.8087088435901071, - "precision": 0.7951899204968929, - "recall": 0.8280564417690509, - "support": 30257.0 - }, - "eval_runtime": 4.8745, - "eval_samples_per_second": 16.617, - "eval_steps_per_second": 2.257, + "f1-score": 0.8166544413541587, + "precision": 0.8181369647876886, + "recall": 0.815721762184714, + "support": 29841.0 + }, + "eval_runtime": 4.8135, + "eval_samples_per_second": 16.62, + "eval_steps_per_second": 2.077, "eval_weighted avg": { - "f1-score": 0.8553636471531488, - "precision": 0.8586347680535737, - "recall": 0.8543477542386886, - "support": 30257.0 + "f1-score": 0.8565562586843419, + "precision": 0.8570179283955386, + "recall": 0.856740725846989, + "support": 29841.0 }, "step": 2268 }, { "epoch": 29.0, "eval_Claim": { - "f1-score": 0.6258845012554212, - "precision": 0.6220508166969148, - "recall": 0.6297657326596233, - "support": 4354.0 + "f1-score": 0.6479684334008745, + "precision": 0.6302904564315353, + "recall": 0.6666666666666666, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8182007064201122, - "precision": 0.7991071428571429, - "recall": 0.8382290336313325, - "support": 2349.0 + "f1-score": 0.8285593934288121, + "precision": 0.7934651068979427, + "recall": 0.8669017188188629, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9212816455696202, - "precision": 0.9275189167662286, - "recall": 0.9151277013752456, - "support": 10180.0 + "f1-score": 0.9062767649577879, + "precision": 0.9417673235855054, + "recall": 0.8733639900955076, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8977727868238817, - "precision": 0.8988831421932388, - "recall": 0.8966651712277554, - "support": 13374.0 + "f1-score": 0.8984971414877958, + "precision": 0.8941200517816993, + "recall": 0.9029172973716802, + "support": 14534.0 }, - "eval_accuracy": 0.8599332385894173, - "eval_loss": 1.013275384902954, + "eval_accuracy": 0.8557018866659964, + "eval_loss": 1.141819953918457, "eval_macro avg": { - "f1-score": 0.8157849100172588, - "precision": 0.8118900046283812, - "recall": 0.8199469097234893, - "support": 30257.0 - }, - "eval_runtime": 4.8916, - "eval_samples_per_second": 16.559, - "eval_steps_per_second": 2.249, + "f1-score": 0.8203254333188175, + "precision": 0.8149107346741707, + "recall": 0.8274624182381793, + "support": 29841.0 + }, + "eval_runtime": 4.7777, + "eval_samples_per_second": 16.744, + "eval_steps_per_second": 2.093, "eval_weighted avg": { - "f1-score": 0.860379911449525, - "precision": 0.8609352431120858, - "recall": 0.8599332385894173, - "support": 30257.0 + "f1-score": 0.857132271461693, + "precision": 0.8597190255498753, + "recall": 0.8557018866659964, + "support": 29841.0 }, "step": 2349 }, { "epoch": 30.0, "eval_Claim": { - "f1-score": 0.6191074795725958, - "precision": 0.5691448382126348, - "recall": 0.6786862655029857, - "support": 4354.0 + "f1-score": 0.6132195178221248, + "precision": 0.6464007782101168, + "recall": 0.5832784726793944, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.802213568354171, - "precision": 0.7735177865612648, - "recall": 0.8331204767986378, - "support": 2349.0 + "f1-score": 0.8116131848941279, + "precision": 0.8040657439446367, + "recall": 0.8193036579991185, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9179413083553385, - "precision": 0.9313517338995047, - "recall": 0.9049115913555992, - "support": 10180.0 + "f1-score": 0.9048840121653051, + "precision": 0.9154198841698842, + "recall": 0.8945879023700035, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8899992313014068, - "precision": 0.9156912369503322, - "recall": 0.8657095857634216, - "support": 13374.0 + "f1-score": 0.9030779085055456, + "precision": 0.8853195849031661, + "recall": 0.9215632310444475, + "support": 14534.0 }, - "eval_accuracy": 0.8494563241563936, - "eval_loss": 1.0923724174499512, + "eval_accuracy": 0.8544619818370698, + "eval_loss": 1.1914094686508179, "eval_macro avg": { - "f1-score": 0.8073153968958781, - "precision": 0.797426398905934, - "recall": 0.8206069798551611, - "support": 30257.0 - }, - "eval_runtime": 4.9081, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 2.241, + "f1-score": 0.8081986558467759, + "precision": 0.8128014978069509, + "recall": 0.804683316023241, + "support": 29841.0 + }, + "eval_runtime": 4.773, + "eval_samples_per_second": 16.761, + "eval_steps_per_second": 2.095, "eval_weighted avg": { - "f1-score": 0.853603657884304, - "precision": 0.8600543728816776, - "recall": 0.8494563241563936, - "support": 30257.0 + "f1-score": 0.8523724837851865, + "precision": 0.8512108978901942, + "recall": 0.8544619818370698, + "support": 29841.0 }, "step": 2430 }, { "epoch": 30.86, - "grad_norm": 1.9078470468521118, + "grad_norm": 0.007714413572102785, "learning_rate": 7.654320987654322e-06, - "loss": 0.0059, + "loss": 0.0028, "step": 2500 }, { "epoch": 31.0, "eval_Claim": { - "f1-score": 0.6110219368646335, - "precision": 0.5720296533760769, - "recall": 0.655718879191548, - "support": 4354.0 + "f1-score": 0.6275360746446783, + "precision": 0.6206008583690987, + "recall": 0.6346280447662936, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8156672723601858, - "precision": 0.7757296466973886, - "recall": 0.8599404001702853, - "support": 2349.0 + "f1-score": 0.8174338447854126, + "precision": 0.8249551166965888, + "recall": 0.8100484795063905, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9190938511326862, - "precision": 0.9318525996971226, - "recall": 0.906679764243615, - "support": 10180.0 + "f1-score": 0.9020403293163107, + "precision": 0.9129332206255283, + "recall": 0.8914043155288291, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.890513183575064, - "precision": 0.9120482872148624, - "recall": 0.8699715866606849, - "support": 13374.0 + "f1-score": 0.8989933575292748, + "precision": 0.8947655398037078, + "recall": 0.9032613182881519, + "support": 14534.0 }, - "eval_accuracy": 0.850712231880226, - "eval_loss": 1.0502196550369263, + "eval_accuracy": 0.8517811065312825, + "eval_loss": 1.231397271156311, "eval_macro avg": { - "f1-score": 0.8090740609831424, - "precision": 0.7979150467463627, - "recall": 0.8230776575665333, - "support": 30257.0 - }, - "eval_runtime": 4.8419, - "eval_samples_per_second": 16.729, - "eval_steps_per_second": 2.272, + "f1-score": 0.8115009015689192, + "precision": 0.8133136838737309, + "recall": 0.8098355395224164, + "support": 29841.0 + }, + "eval_runtime": 4.7995, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 2.084, "eval_weighted avg": { - "f1-score": 0.8540995689442556, - "precision": 0.8591995012400396, - "recall": 0.850712231880226, - "support": 30257.0 + "f1-score": 0.8522037725691503, + "precision": 0.8527532680206674, + "recall": 0.8517811065312825, + "support": 29841.0 }, "step": 2511 }, { "epoch": 32.0, "eval_Claim": { - "f1-score": 0.5963855421686747, - "precision": 0.6272174353775976, - "recall": 0.5684428112080845, - "support": 4354.0 + "f1-score": 0.6187466523835029, + "precision": 0.6044370029300963, + "recall": 0.6337502743032697, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8180682764363031, - "precision": 0.8004073319755601, - "recall": 0.8365261813537676, - "support": 2349.0 + "f1-score": 0.8172382671480145, + "precision": 0.8372630605640314, + "recall": 0.7981489643014544, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9205133306804616, - "precision": 0.9323861346231358, - "recall": 0.9089390962671906, - "support": 10180.0 + "f1-score": 0.9010989010989012, + "precision": 0.9079482882451521, + "recall": 0.8943520811225092, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9026587563172929, - "precision": 0.8845822566752799, - "recall": 0.9214894571556752, - "support": 13374.0 + "f1-score": 0.8937414030261347, + "precision": 0.8933727485219304, + "recall": 0.8941103619100041, + "support": 14534.0 }, - "eval_accuracy": 0.8598671381828998, - "eval_loss": 1.0191655158996582, + "eval_accuracy": 0.847123085687477, + "eval_loss": 1.2467483282089233, "eval_macro avg": { - "f1-score": 0.8094064764006831, - "precision": 0.8111482896628934, - "recall": 0.8088493864961794, - "support": 30257.0 - }, - "eval_runtime": 4.8429, - "eval_samples_per_second": 16.725, - "eval_steps_per_second": 2.271, + "f1-score": 0.8077063059141383, + "precision": 0.8107552750653025, + "recall": 0.8050904204093093, + "support": 29841.0 + }, + "eval_runtime": 4.804, + "eval_samples_per_second": 16.653, + "eval_steps_per_second": 2.082, "eval_weighted avg": { - "f1-score": 0.8580258765001771, - "precision": 0.8570960600087044, - "recall": 0.8598671381828998, - "support": 30257.0 + "f1-score": 0.8480211606471663, + "precision": 0.8491256414462351, + "recall": 0.847123085687477, + "support": 29841.0 }, "step": 2592 }, { "epoch": 33.0, "eval_Claim": { - "f1-score": 0.6162361623616236, - "precision": 0.618805002315887, - "recall": 0.6136885622416169, - "support": 4354.0 + "f1-score": 0.6165579750193435, + "precision": 0.6211581291759466, + "recall": 0.6120254553434277, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8282912580847068, - "precision": 0.8121931260229133, - "recall": 0.8450404427415922, - "support": 2349.0 + "f1-score": 0.8063751884557399, + "precision": 0.7885425442291492, + "recall": 0.8250330542089026, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9207272010641968, - "precision": 0.9235939507759218, - "recall": 0.9178781925343812, - "support": 10180.0 + "f1-score": 0.905199879771566, + "precision": 0.9233505028207015, + "recall": 0.8877490861926659, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8987739234449761, - "precision": 0.8986395574824338, - "recall": 0.8989083295947361, - "support": 13374.0 + "f1-score": 0.897230643458119, + "precision": 0.8884841125278283, + "recall": 0.9061510939865144, + "support": 14534.0 }, - "eval_accuracy": 0.8600654394024523, - "eval_loss": 1.0603935718536377, + "eval_accuracy": 0.8498374719345867, + "eval_loss": 1.2608078718185425, "eval_macro avg": { - "f1-score": 0.8160071362388759, - "precision": 0.813307909149289, - "recall": 0.8188788817780815, - "support": 30257.0 - }, - "eval_runtime": 4.8566, - "eval_samples_per_second": 16.678, - "eval_steps_per_second": 2.265, + "f1-score": 0.8063409216761921, + "precision": 0.8053838221884064, + "recall": 0.8077396724328777, + "support": 29841.0 + }, + "eval_runtime": 4.7947, + "eval_samples_per_second": 16.685, + "eval_steps_per_second": 2.086, "eval_weighted avg": { - "f1-score": 0.8600308614585094, - "precision": 0.8600558711630416, - "recall": 0.8600654394024523, - "support": 30257.0 + "f1-score": 0.8497258921327092, + "precision": 0.8499709906977834, + "recall": 0.8498374719345867, + "support": 29841.0 }, "step": 2673 }, { "epoch": 34.0, "eval_Claim": { - "f1-score": 0.6198869304955105, - "precision": 0.5991000642811227, - "recall": 0.6421681212677998, - "support": 4354.0 + "f1-score": 0.6242761692650335, + "precision": 0.633732760569749, + "recall": 0.6150976519640114, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8214212991244145, - "precision": 0.7872755659640905, - "recall": 0.8586632609621115, - "support": 2349.0 + "f1-score": 0.8270332187857962, + "precision": 0.8611641221374046, + "recall": 0.7955046275892463, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9196205691462807, - "precision": 0.9350253807106599, - "recall": 0.9047151277013753, - "support": 10180.0 + "f1-score": 0.9015324995596267, + "precision": 0.8978947368421053, + "recall": 0.9051998585072515, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.897408858089786, - "precision": 0.9040825618455001, - "recall": 0.8908329594736055, - "support": 13374.0 + "f1-score": 0.8962669760458609, + "precision": 0.8890468453831574, + "recall": 0.9036053392046236, + "support": 14534.0 }, - "eval_accuracy": 0.8572231219221998, - "eval_loss": 1.002353310585022, + "eval_accuracy": 0.8517811065312825, + "eval_loss": 1.2305262088775635, "eval_macro avg": { - "f1-score": 0.8145844142139979, - "precision": 0.8063708932003434, - "recall": 0.8240948673512231, - "support": 30257.0 - }, - "eval_runtime": 4.8525, - "eval_samples_per_second": 16.692, - "eval_steps_per_second": 2.267, + "f1-score": 0.8122772159140793, + "precision": 0.820459616233104, + "recall": 0.8048518693162833, + "support": 29841.0 + }, + "eval_runtime": 4.7809, + "eval_samples_per_second": 16.733, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8590471556672056, - "precision": 0.8615378438736785, - "recall": 0.8572231219221998, - "support": 30257.0 + "f1-score": 0.8509636485165197, + "precision": 0.8504525215978962, + "recall": 0.8517811065312825, + "support": 29841.0 }, "step": 2754 }, { "epoch": 35.0, "eval_Claim": { - "f1-score": 0.6195019781242729, - "precision": 0.6278301886792453, - "recall": 0.6113918236104732, - "support": 4354.0 + "f1-score": 0.633076593923834, + "precision": 0.6176163640158631, + "recall": 0.6493307000219443, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8297086581862947, - "precision": 0.8007920792079208, - "recall": 0.8607918263090677, - "support": 2349.0 + "f1-score": 0.8311867525298988, + "precision": 0.8691678691678691, + "recall": 0.7963860731599823, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9212497535974769, - "precision": 0.9243473101265823, - "recall": 0.9181728880157171, - "support": 10180.0 + "f1-score": 0.9039272770483037, + "precision": 0.9110179640718563, + "recall": 0.8969461148449476, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9000523286237572, - "precision": 0.8998505231689088, - "recall": 0.9002542246149244, - "support": 13374.0 + "f1-score": 0.8963128108386212, + "precision": 0.8936461254360167, + "recall": 0.8989954589239025, + "support": 14534.0 }, - "eval_accuracy": 0.8616518491588723, - "eval_loss": 1.005292296409607, + "eval_accuracy": 0.8524848362990516, + "eval_loss": 1.2047479152679443, "eval_macro avg": { - "f1-score": 0.8176281796329504, - "precision": 0.8132050252956643, - "recall": 0.8226526906375455, - "support": 30257.0 - }, - "eval_runtime": 4.883, - "eval_samples_per_second": 16.588, - "eval_steps_per_second": 2.253, + "f1-score": 0.8161258585851644, + "precision": 0.8228620806729012, + "recall": 0.8104145867376942, + "support": 29841.0 + }, + "eval_runtime": 4.7907, + "eval_samples_per_second": 16.699, + "eval_steps_per_second": 2.087, "eval_weighted avg": { - "f1-score": 0.8613517396129535, - "precision": 0.8612582129595939, - "recall": 0.8616518491588723, - "support": 30257.0 + "f1-score": 0.8533263097542454, + "precision": 0.8545697465347227, + "recall": 0.8524848362990516, + "support": 29841.0 }, "step": 2835 }, { "epoch": 36.0, "eval_Claim": { - "f1-score": 0.6118366866690199, - "precision": 0.6272617611580217, - "recall": 0.5971520440973818, - "support": 4354.0 + "f1-score": 0.6346997752327946, + "precision": 0.6195152528207272, + "recall": 0.6506473557164801, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8270394325057375, - "precision": 0.8109656301145662, - "recall": 0.8437633035334184, - "support": 2349.0 + "f1-score": 0.8192934782608694, + "precision": 0.8425710293432697, + "recall": 0.7972675187307183, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9219198416625434, - "precision": 0.9288135593220339, - "recall": 0.9151277013752456, - "support": 10180.0 + "f1-score": 0.9063178271836687, + "precision": 0.9018211533971515, + "recall": 0.9108595684471171, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8994520953650229, - "precision": 0.8907464437600822, - "recall": 0.908329594736055, - "support": 13374.0 + "f1-score": 0.8959689707715751, + "precision": 0.9019662529633246, + "recall": 0.8900509150956378, + "support": 14534.0 }, - "eval_accuracy": 0.8608255940774036, - "eval_loss": 1.0221480131149292, + "eval_accuracy": 0.8523507925337622, + "eval_loss": 1.2302902936935425, "eval_macro avg": { - "f1-score": 0.8150620140505809, - "precision": 0.814446848588676, - "recall": 0.8160931609355251, - "support": 30257.0 - }, - "eval_runtime": 4.8502, - "eval_samples_per_second": 16.7, - "eval_steps_per_second": 2.268, + "f1-score": 0.8140700128622269, + "precision": 0.8164684221311183, + "recall": 0.8122063394974884, + "support": 29841.0 + }, + "eval_runtime": 4.803, + "eval_samples_per_second": 16.656, + "eval_steps_per_second": 2.082, "eval_weighted avg": { - "f1-score": 0.8600016152377763, - "precision": 0.8594447878496476, - "recall": 0.8608255940774036, - "support": 30257.0 + "f1-score": 0.8531818066233882, + "precision": 0.8542759088239045, + "recall": 0.8523507925337622, + "support": 29841.0 }, "step": 2916 }, { "epoch": 37.0, "eval_Claim": { - "f1-score": 0.5992254430231193, - "precision": 0.6126709863210943, - "recall": 0.586357372531006, - "support": 4354.0 + "f1-score": 0.6348107625320978, + "precision": 0.6461363636363636, + "recall": 0.6238753565942506, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8153438073862477, - "precision": 0.7829153605015674, - "recall": 0.8505747126436781, - "support": 2349.0 + "f1-score": 0.821917808219178, + "precision": 0.8526764566556134, + "recall": 0.7933010136624064, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9200099181750558, - "precision": 0.928993490235353, - "recall": 0.9111984282907662, - "support": 10180.0 + "f1-score": 0.9034164794893014, + "precision": 0.9057721939077872, + "recall": 0.9010729866760995, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8983548111560886, - "precision": 0.8924223419169187, - "recall": 0.9043666816210558, - "support": 13374.0 + "f1-score": 0.9000577700751011, + "precision": 0.8892096958302558, + "recall": 0.9111737993670015, + "support": 14534.0 }, - "eval_accuracy": 0.8567273688733186, - "eval_loss": 1.0784204006195068, + "eval_accuracy": 0.85546731007674, + "eval_loss": 1.2363109588623047, "eval_macro avg": { - "f1-score": 0.8082334949351277, - "precision": 0.8042505447437334, - "recall": 0.8131242987716265, - "support": 30257.0 - }, - "eval_runtime": 4.8665, - "eval_samples_per_second": 16.644, - "eval_steps_per_second": 2.26, + "f1-score": 0.8150507050789195, + "precision": 0.823448677507505, + "recall": 0.8073557890749394, + "support": 29841.0 + }, + "eval_runtime": 4.7822, + "eval_samples_per_second": 16.729, + "eval_steps_per_second": 2.091, "eval_weighted avg": { - "f1-score": 0.8561512507484733, - "precision": 0.855968793590012, - "recall": 0.8567273688733186, - "support": 30257.0 + "f1-score": 0.8545651601664946, + "precision": 0.8540194358423435, + "recall": 0.85546731007674, + "support": 29841.0 }, "step": 2997 }, { "epoch": 37.04, - "grad_norm": 0.5529414415359497, + "grad_norm": 0.3124696612358093, "learning_rate": 5.185185185185185e-06, - "loss": 0.0056, + "loss": 0.0015, "step": 3000 }, { "epoch": 38.0, "eval_Claim": { - "f1-score": 0.5970562334884891, - "precision": 0.6600834492350487, - "recall": 0.545016077170418, - "support": 4354.0 + "f1-score": 0.6297771557756486, + "precision": 0.6181318681318682, + "recall": 0.6418696510862409, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8171079429735234, - "precision": 0.7832877782116361, - "recall": 0.853980417198808, - "support": 2349.0 + "f1-score": 0.8197488827410088, + "precision": 0.7925925925925926, + "recall": 0.8488320846187748, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9201859554685589, - "precision": 0.9168210628961482, - "recall": 0.9235756385068762, - "support": 10180.0 + "f1-score": 0.9054678007290401, + "precision": 0.9339516230104024, + "recall": 0.8786699681641316, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9016899338721528, - "precision": 0.886320959121768, - "recall": 0.917601315986242, - "support": 13374.0 + "f1-score": 0.8958062529930902, + "precision": 0.8907482993197279, + "recall": 0.9009219760561442, + "support": 14534.0 }, - "eval_accuracy": 0.8610569455002148, - "eval_loss": 1.0626990795135498, + "eval_accuracy": 0.8510773767635132, + "eval_loss": 1.264951467514038, "eval_macro avg": { - "f1-score": 0.809010016450681, - "precision": 0.8116283123661503, - "recall": 0.810043362215586, - "support": 30257.0 - }, - "eval_runtime": 4.8375, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 2.274, + "f1-score": 0.812700023059697, + "precision": 0.8088560957636478, + "recall": 0.8175734199813228, + "support": 29841.0 + }, + "eval_runtime": 4.8007, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 2.083, "eval_weighted avg": { - "f1-score": 0.857509455693882, - "precision": 0.8560280681021202, - "recall": 0.8610569455002148, - "support": 30257.0 + "f1-score": 0.8521438696020087, + "precision": 0.8539324758799526, + "recall": 0.8510773767635132, + "support": 29841.0 }, "step": 3078 }, { "epoch": 39.0, "eval_Claim": { - "f1-score": 0.6197119201542475, - "precision": 0.6121442975576966, - "recall": 0.6274689940284796, - "support": 4354.0 + "f1-score": 0.6320949994552784, + "precision": 0.6276503678061445, + "recall": 0.6366030283080975, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8049129989764585, - "precision": 0.7752365930599369, - "recall": 0.8369518944231588, - "support": 2349.0 + "f1-score": 0.8298865910607072, + "precision": 0.8375224416517055, + "recall": 0.8223887174966946, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9190203436697609, - "precision": 0.9239475774424146, - "recall": 0.9141453831041257, - "support": 10180.0 + "f1-score": 0.9067027918482744, + "precision": 0.90584912321996, + "recall": 0.9075580709821955, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8999246987951808, - "precision": 0.9063400576368876, - "recall": 0.8935995214595484, - "support": 13374.0 + "f1-score": 0.897340498828717, + "precision": 0.8985787222298882, + "recall": 0.8961056832255401, + "support": 14534.0 }, - "eval_accuracy": 0.8578180255808573, - "eval_loss": 1.0806539058685303, + "eval_accuracy": 0.8541268724238464, + "eval_loss": 1.2218141555786133, "eval_macro avg": { - "f1-score": 0.8108924903989119, - "precision": 0.8044171314242339, - "recall": 0.8180414482538281, - "support": 30257.0 - }, - "eval_runtime": 4.879, - "eval_samples_per_second": 16.602, - "eval_steps_per_second": 2.255, + "f1-score": 0.8165062202982443, + "precision": 0.8174001637269246, + "recall": 0.8156638750031319, + "support": 29841.0 + }, + "eval_runtime": 4.7791, + "eval_samples_per_second": 16.74, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8586504397393069, - "precision": 0.8597509765628951, - "recall": 0.8578180255808573, - "support": 30257.0 + "f1-score": 0.8543669037658335, + "precision": 0.85462922519748, + "recall": 0.8541268724238464, + "support": 29841.0 }, "step": 3159 }, { "epoch": 40.0, "eval_Claim": { - "f1-score": 0.6083916083916084, - "precision": 0.6403553299492386, - "recall": 0.5794671566375746, - "support": 4354.0 + "f1-score": 0.6463350510043117, + "precision": 0.6205573505654282, + "recall": 0.674347158218126, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.806698366756254, - "precision": 0.7841639871382636, - "recall": 0.8305661983822903, - "support": 2349.0 + "f1-score": 0.8254958769779362, + "precision": 0.8349864743011722, + "recall": 0.8162185985015425, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9171535580524344, - "precision": 0.9327577450482478, - "recall": 0.9020628683693517, - "support": 10180.0 + "f1-score": 0.9064204783885857, + "precision": 0.9219512195121952, + "recall": 0.8914043155288291, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.9035748227209591, - "precision": 0.8838672768878718, - "recall": 0.924181247196052, - "support": 13374.0 + "f1-score": 0.8983278745043958, + "precision": 0.9002833252712321, + "recall": 0.8963808999587175, + "support": 14534.0 }, - "eval_accuracy": 0.8598671381828998, - "eval_loss": 1.0857013463974, + "eval_accuracy": 0.8549646459569049, + "eval_loss": 1.2532273530960083, "eval_macro avg": { - "f1-score": 0.808954588980314, - "precision": 0.8102860847559054, - "recall": 0.8090693676463172, - "support": 30257.0 - }, - "eval_runtime": 4.8891, - "eval_samples_per_second": 16.568, - "eval_steps_per_second": 2.25, + "f1-score": 0.8191448202188073, + "precision": 0.8194445924125069, + "recall": 0.8195877430518038, + "support": 29841.0 + }, + "eval_runtime": 4.7911, + "eval_samples_per_second": 16.697, + "eval_steps_per_second": 2.087, "eval_weighted avg": { - "f1-score": 0.8581453688895593, - "precision": 0.8575345578899536, - "recall": 0.8598671381828998, - "support": 30257.0 + "f1-score": 0.8566083032589413, + "precision": 0.8587597700777799, + "recall": 0.8549646459569049, + "support": 29841.0 }, "step": 3240 }, { "epoch": 41.0, "eval_Claim": { - "f1-score": 0.633541759714158, - "precision": 0.616471099521947, - "recall": 0.6515847496554892, - "support": 4354.0 + "f1-score": 0.6371372463451888, + "precision": 0.6335430679106097, + "recall": 0.6407724380074611, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8099445243476474, - "precision": 0.7827640984908658, - "recall": 0.8390804597701149, - "support": 2349.0 + "f1-score": 0.8270404702690481, + "precision": 0.8491179201485608, + "recall": 0.8060819744380785, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9174538800138484, - "precision": 0.9238968024703655, - "recall": 0.9111001964636543, - "support": 10180.0 + "f1-score": 0.9051774973463852, + "precision": 0.905391058157367, + "recall": 0.9049640372597572, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8984587488667273, - "precision": 0.907924874026569, - "recall": 0.889187976671153, - "support": 13374.0 + "f1-score": 0.8991934099879869, + "precision": 0.8971303335387987, + "recall": 0.9012659969726159, + "support": 14534.0 }, - "eval_accuracy": 0.8584790296460323, - "eval_loss": 1.082669973373413, + "eval_accuracy": 0.8552997553701284, + "eval_loss": 1.2720471620559692, "eval_macro avg": { - "f1-score": 0.8148497282355953, - "precision": 0.8077642186274367, - "recall": 0.8227383456401028, - "support": 30257.0 - }, - "eval_runtime": 4.8808, - "eval_samples_per_second": 16.596, - "eval_steps_per_second": 2.254, + "f1-score": 0.8171371559871523, + "precision": 0.821295594938834, + "recall": 0.8132711116694782, + "support": 29841.0 + }, + "eval_runtime": 4.7858, + "eval_samples_per_second": 16.716, + "eval_steps_per_second": 2.09, "eval_weighted avg": { - "f1-score": 0.8598561759385482, - "precision": 0.8616414300510049, - "recall": 0.8584790296460323, - "support": 30257.0 + "f1-score": 0.8553894519083003, + "precision": 0.8555751534188286, + "recall": 0.8552997553701284, + "support": 29841.0 }, "step": 3321 }, { "epoch": 42.0, "eval_Claim": { - "f1-score": 0.6143497757847534, - "precision": 0.6000876040297853, - "recall": 0.6293063849333945, - "support": 4354.0 + "f1-score": 0.6300342759211655, + "precision": 0.6154007114459091, + "recall": 0.6453807329383366, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8115216030056356, - "precision": 0.7960687960687961, - "recall": 0.8275862068965517, - "support": 2349.0 + "f1-score": 0.8309070548712206, + "precision": 0.8447176684881603, + "recall": 0.8175407668576465, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9185947728749189, - "precision": 0.9348998067338012, - "recall": 0.9028487229862475, - "support": 10180.0 + "f1-score": 0.9059788703299297, + "precision": 0.9069959820373434, + "recall": 0.9049640372597572, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8983278590624066, - "precision": 0.8968549709345655, - "recall": 0.8998055929415283, - "support": 13374.0 + "f1-score": 0.8946713663694795, + "precision": 0.8987086920299917, + "recall": 0.8906701527452869, + "support": 14534.0 }, - "eval_accuracy": 0.8562977162309549, - "eval_loss": 1.1027238368988037, + "eval_accuracy": 0.8517140846486377, + "eval_loss": 1.273967981338501, "eval_macro avg": { - "f1-score": 0.8106985026819286, - "precision": 0.806977794441737, - "recall": 0.8148867269394304, - "support": 30257.0 - }, - "eval_runtime": 4.8725, - "eval_samples_per_second": 16.624, - "eval_steps_per_second": 2.258, + "f1-score": 0.8153978918729488, + "precision": 0.8164557635003511, + "recall": 0.8146389224502568, + "support": 29841.0 + }, + "eval_runtime": 4.785, + "eval_samples_per_second": 16.719, + "eval_steps_per_second": 2.09, "eval_weighted avg": { - "f1-score": 0.8575428741842996, - "precision": 0.8591256715384956, - "recall": 0.8562977162309549, - "support": 30257.0 + "f1-score": 0.8526240655794947, + "precision": 0.8536949326591351, + "recall": 0.8517140846486377, + "support": 29841.0 }, "step": 3402 }, { "epoch": 43.0, "eval_Claim": { - "f1-score": 0.6311159978009895, - "precision": 0.6053575195106518, - "recall": 0.6591639871382636, - "support": 4354.0 + "f1-score": 0.6327562103451985, + "precision": 0.620413327709827, + "recall": 0.6456001755540927, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8066581306017925, - "precision": 0.8087291399229781, - "recall": 0.8045977011494253, - "support": 2349.0 + "f1-score": 0.8331148973350809, + "precision": 0.8258986574274578, + "recall": 0.8404583516967827, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9192947603675194, - "precision": 0.9296835760924159, - "recall": 0.9091355599214146, - "support": 10180.0 + "f1-score": 0.9066080864454076, + "precision": 0.9130590767758909, + "recall": 0.9002476123098692, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8996917061433192, - "precision": 0.904794313369631, - "recall": 0.8946463286974727, - "support": 13374.0 + "f1-score": 0.8955873213175887, + "precision": 0.8988771832547824, + "recall": 0.8923214531443512, + "support": 14534.0 }, - "eval_accuracy": 0.8586442806623261, - "eval_loss": 1.0912280082702637, + "eval_accuracy": 0.8529539894775644, + "eval_loss": 1.2849647998809814, "eval_macro avg": { - "f1-score": 0.8141901487284051, - "precision": 0.8121411372239192, - "recall": 0.816885894226644, - "support": 30257.0 - }, - "eval_runtime": 4.8617, - "eval_samples_per_second": 16.661, - "eval_steps_per_second": 2.263, + "f1-score": 0.8170166288608189, + "precision": 0.8145620612919895, + "recall": 0.819656898176274, + "support": 29841.0 + }, + "eval_runtime": 4.7796, + "eval_samples_per_second": 16.738, + "eval_steps_per_second": 2.092, "eval_weighted avg": { - "f1-score": 0.8604163182639131, - "precision": 0.8626211898487851, - "recall": 0.8586442806623261, - "support": 30257.0 + "f1-score": 0.8538325478961732, + "precision": 0.8548347106208881, + "recall": 0.8529539894775644, + "support": 29841.0 }, "step": 3483 }, { "epoch": 43.21, - "grad_norm": 1.988065481185913, + "grad_norm": 11.103137969970703, "learning_rate": 2.7160493827160496e-06, - "loss": 0.0038, + "loss": 0.001, "step": 3500 }, { "epoch": 44.0, "eval_Claim": { - "f1-score": 0.6289838978345363, - "precision": 0.6089013115459041, - "recall": 0.6504363803399174, - "support": 4354.0 + "f1-score": 0.6296918767507003, + "precision": 0.6433150183150184, + "recall": 0.6166337502743032, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8161013485901104, - "precision": 0.7846758349705305, - "recall": 0.8501489995742869, - "support": 2349.0 + "f1-score": 0.8321428571428572, + "precision": 0.8430574400723655, + "recall": 0.8215072719259586, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9186826287814813, - "precision": 0.9292533413727263, - "recall": 0.9083497053045186, - "support": 10180.0 + "f1-score": 0.908139604019264, + "precision": 0.9159270808347325, + "recall": 0.9004834335573635, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8984292402960278, - "precision": 0.9074752097635392, - "recall": 0.8895618363989831, - "support": 13374.0 + "f1-score": 0.9008079299341435, + "precision": 0.8890377914768158, + "recall": 0.9128939039493601, + "support": 14534.0 }, - "eval_accuracy": 0.8584129292395148, - "eval_loss": 1.096985101699829, + "eval_accuracy": 0.8571763680841795, + "eval_loss": 1.2746751308441162, "eval_macro avg": { - "f1-score": 0.815549278875539, - "precision": 0.807576424413175, - "recall": 0.8246242304044265, - "support": 30257.0 - }, - "eval_runtime": 4.8433, - "eval_samples_per_second": 16.724, - "eval_steps_per_second": 2.271, + "f1-score": 0.8176955669617412, + "precision": 0.822834332674733, + "recall": 0.8128795899267465, + "support": 29841.0 + }, + "eval_runtime": 4.7778, + "eval_samples_per_second": 16.744, + "eval_steps_per_second": 2.093, "eval_weighted avg": { - "f1-score": 0.860078652203599, - "precision": 0.8623040062586698, - "recall": 0.8584129292395148, - "support": 30257.0 + "f1-score": 0.8562686391394492, + "precision": 0.8556595524234826, + "recall": 0.8571763680841795, + "support": 29841.0 }, "step": 3564 }, { "epoch": 45.0, "eval_Claim": { - "f1-score": 0.6183596860425435, - "precision": 0.6125760649087221, - "recall": 0.6242535599448783, - "support": 4354.0 + "f1-score": 0.6363438992618324, + "precision": 0.6296455424274973, + "recall": 0.6431863067807768, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8194356036494802, - "precision": 0.8168358714043993, - "recall": 0.8220519369944658, - "support": 2349.0 + "f1-score": 0.8294691224268689, + "precision": 0.8158567774936062, + "recall": 0.8435434111943587, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9192996379147859, - "precision": 0.9284640817553351, - "recall": 0.9103143418467583, - "support": 10180.0 + "f1-score": 0.9093409879201052, + "precision": 0.9225822108967359, + "recall": 0.8964744723499587, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8989534060858877, - "precision": 0.8955844155844156, - "recall": 0.9023478390907731, - "support": 13374.0 + "f1-score": 0.8978134761267291, + "precision": 0.8958147818343722, + "recall": 0.8998211091234347, + "support": 14534.0 }, - "eval_accuracy": 0.8587764814753611, - "eval_loss": 1.090890645980835, + "eval_accuracy": 0.8554002881940954, + "eval_loss": 1.2960079908370972, "eval_macro avg": { - "f1-score": 0.8140120834231743, - "precision": 0.813365108413218, - "recall": 0.8147419194692188, - "support": 30257.0 - }, - "eval_runtime": 4.8953, - "eval_samples_per_second": 16.546, - "eval_steps_per_second": 2.247, + "f1-score": 0.8182418714338839, + "precision": 0.8159748281630528, + "recall": 0.8207563248621323, + "support": 29841.0 + }, + "eval_runtime": 4.79, + "eval_samples_per_second": 16.701, + "eval_steps_per_second": 2.088, "eval_weighted avg": { - "f1-score": 0.8592479582565041, - "precision": 0.8598081096882307, - "recall": 0.8587764814753611, - "support": 30257.0 + "f1-score": 0.8559641623370206, + "precision": 0.8566960066610061, + "recall": 0.8554002881940954, + "support": 29841.0 }, "step": 3645 }, { "epoch": 46.0, "eval_Claim": { - "f1-score": 0.6084337349397592, - "precision": 0.613838242169238, - "recall": 0.6031235645383556, - "support": 4354.0 + "f1-score": 0.6322691604858648, + "precision": 0.6196797302991993, + "recall": 0.6453807329383366, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8203753351206435, - "precision": 0.7956, - "recall": 0.8467432950191571, - "support": 2349.0 + "f1-score": 0.8332607749238136, + "precision": 0.8232258064516129, + "recall": 0.8435434111943587, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.918908188585608, - "precision": 0.9285857572718155, - "recall": 0.9094302554027505, - "support": 10180.0 + "f1-score": 0.9089284650664124, + "precision": 0.9183919114106885, + "recall": 0.8996580591911332, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8986348249823308, - "precision": 0.8941446443111999, - "recall": 0.9031703304919994, - "support": 13374.0 + "f1-score": 0.895985653193544, + "precision": 0.8982160143825197, + "recall": 0.8937663409935324, + "support": 14534.0 }, - "eval_accuracy": 0.8577188749710811, - "eval_loss": 1.0958248376846313, + "eval_accuracy": 0.8536912301866559, + "eval_loss": 1.2958593368530273, "eval_macro avg": { - "f1-score": 0.8115880209070854, - "precision": 0.8080421609380632, - "recall": 0.8156168613630657, - "support": 30257.0 - }, - "eval_runtime": 4.8566, - "eval_samples_per_second": 16.678, - "eval_steps_per_second": 2.265, + "f1-score": 0.8176110134174086, + "precision": 0.8148783656360051, + "recall": 0.8205871360793402, + "support": 29841.0 + }, + "eval_runtime": 4.7995, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 2.084, "eval_weighted avg": { - "f1-score": 0.8576200434028913, - "precision": 0.8577456320339072, - "recall": 0.8577188749710811, - "support": 30257.0 + "f1-score": 0.8546227357789428, + "precision": 0.8557130538360561, + "recall": 0.8536912301866559, + "support": 29841.0 }, "step": 3726 }, { "epoch": 47.0, "eval_Claim": { - "f1-score": 0.6183818473527389, - "precision": 0.6171088746569076, - "recall": 0.6196600826825908, - "support": 4354.0 + "f1-score": 0.6343719035560937, + "precision": 0.6365444100751215, + "recall": 0.6322141759929778, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8325883787078424, - "precision": 0.7963466770307035, - "recall": 0.8722860791826309, - "support": 2349.0 + "f1-score": 0.8321970530019793, + "precision": 0.8305531167690957, + "recall": 0.8338475099162627, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.9196415309204337, - "precision": 0.9271238893880404, - "recall": 0.9122789783889981, - "support": 10180.0 + "f1-score": 0.9086917828537526, + "precision": 0.9144972534033915, + "recall": 0.9029595566560548, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.8969965128051295, - "precision": 0.8996615268898082, - "recall": 0.8943472409152086, - "support": 13374.0 + "f1-score": 0.8988594718635478, + "precision": 0.8949055445679601, + "recall": 0.9028484931883859, + "support": 14534.0 }, - "eval_accuracy": 0.8591400337112073, - "eval_loss": 1.0940934419631958, + "eval_accuracy": 0.8563050836097986, + "eval_loss": 1.28843092918396, "eval_macro avg": { - "f1-score": 0.8169020674465362, - "precision": 0.810060241991365, - "recall": 0.824643095292357, - "support": 30257.0 - }, - "eval_runtime": 4.8579, - "eval_samples_per_second": 16.674, - "eval_steps_per_second": 2.264, + "f1-score": 0.8185300528188434, + "precision": 0.8191250812038922, + "recall": 0.8179674339384202, + "support": 29841.0 + }, + "eval_runtime": 4.7779, + "eval_samples_per_second": 16.744, + "eval_steps_per_second": 2.093, "eval_weighted avg": { - "f1-score": 0.8595223191983462, - "precision": 0.8602209352941748, - "recall": 0.8591400337112073, - "support": 30257.0 + "f1-score": 0.8561953839420291, + "precision": 0.8561263459510842, + "recall": 0.8563050836097986, + "support": 29841.0 }, "step": 3807 }, { "epoch": 48.0, "eval_Claim": { - "f1-score": 0.6188739457488033, - "precision": 0.6142533936651584, - "recall": 0.6235645383555352, - "support": 4354.0 + "f1-score": 0.6376558058167504, + "precision": 0.6354325561124428, + "recall": 0.6398946675444371, + "support": 4557.0 }, "eval_MajorClaim": { - "f1-score": 0.8311582381729201, - "precision": 0.7976516634050881, - "recall": 0.8676032354193274, - "support": 2349.0 + "f1-score": 0.8332228849127457, + "precision": 0.8352524357838795, + "recall": 0.8312031732040547, + "support": 2269.0 }, "eval_O": { - "f1-score": 0.91950954217344, - "precision": 0.9256420465857057, - "recall": 0.9134577603143419, - "support": 10180.0 + "f1-score": 0.9087235559781318, + "precision": 0.9160177309212891, + "recall": 0.9015446291710884, + "support": 8481.0 }, "eval_Premise": { - "f1-score": 0.89695603156708, - "precision": 0.9016319129646418, - "recall": 0.892328398384926, - "support": 13374.0 + "f1-score": 0.8999006202666118, + "precision": 0.8964293029289274, + "recall": 0.9033989266547406, + "support": 14534.0 }, - "eval_accuracy": 0.8588425818818786, - "eval_loss": 1.095285415649414, + "eval_accuracy": 0.8571428571428571, + "eval_loss": 1.2850925922393799, "eval_macro avg": { - "f1-score": 0.8166244394155608, - "precision": 0.8097947541551485, - "recall": 0.8242384831185325, - "support": 30257.0 - }, - "eval_runtime": 4.8519, - "eval_samples_per_second": 16.695, - "eval_steps_per_second": 2.267, + "f1-score": 0.81987571674356, + "precision": 0.8207830064366348, + "recall": 0.8190103491435802, + "support": 29841.0 + }, + "eval_runtime": 4.7863, + "eval_samples_per_second": 16.714, + "eval_steps_per_second": 2.089, "eval_weighted avg": { - "f1-score": 0.8594198025832774, - "precision": 0.8602837119208202, - "recall": 0.8588425818818786, - "support": 30257.0 + "f1-score": 0.8572909864340814, + "precision": 0.8574881471703532, + "recall": 0.8571428571428571, + "support": 29841.0 }, "step": 3888 } @@ -2223,7 +2223,7 @@ "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, - "total_flos": 6880424825635200.0, + "total_flos": 6901859170886400.0, "train_batch_size": 4, "trial_name": null, "trial_params": null