diff --git "a/checkpoint-3888/trainer_state.json" "b/checkpoint-3888/trainer_state.json" --- "a/checkpoint-3888/trainer_state.json" +++ "b/checkpoint-3888/trainer_state.json" @@ -11,2209 +11,2209 @@ { "epoch": 1.0, "eval_Claim": { - "f1-score": 0.38183790485045715, - "precision": 0.6497890295358649, - "recall": 0.27035330261136714, - "support": 4557.0 + "f1-score": 0.4888068880688806, + "precision": 0.6228840125391849, + "recall": 0.40222672064777326, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.6266258607498087, - "precision": 0.5535653937140926, - "recall": 0.7219039224327898, - "support": 2269.0 + "f1-score": 0.7325278370054489, + "precision": 0.7604525332021643, + "recall": 0.706581352833638, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8545803971812939, - "precision": 0.8443037974683544, - "recall": 0.8651102464332037, - "support": 8481.0 + "f1-score": 0.8634848138844484, + "precision": 0.827613377692173, + "recall": 0.902606702950444, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.878949075575738, - "precision": 0.8314310260186549, - "recall": 0.9322278794550709, - "support": 14534.0 + "f1-score": 0.8792819197655248, + "precision": 0.8543458914268763, + "recall": 0.9057173407132524, + "support": 15899.0 }, - "eval_accuracy": 0.7960859220535504, - "eval_loss": 0.5359914898872375, + "eval_accuracy": 0.8174925373134329, + "eval_loss": 0.49806877970695496, "eval_macro avg": { - "f1-score": 0.6854983095893245, - "precision": 0.7197723116842417, - "recall": 0.697398837733108, - "support": 29841.0 - }, - "eval_runtime": 4.8191, - "eval_samples_per_second": 16.601, - "eval_steps_per_second": 2.075, + "f1-score": 0.7410253646810757, + "precision": 0.7663239537150996, + "recall": 0.7292830292862769, + "support": 33500.0 + }, + "eval_runtime": 4.9194, + "eval_samples_per_second": 16.465, + "eval_steps_per_second": 2.236, "eval_weighted avg": { - "f1-score": 0.7769240850962494, - "precision": 0.7862232339538372, - "recall": 0.7960859220535504, - "support": 29841.0 + "f1-score": 0.8071778099281224, + "precision": 0.80572410140167, + "recall": 0.8174925373134329, + "support": 33500.0 }, "step": 81 }, { "epoch": 2.0, "eval_Claim": { - "f1-score": 0.6161300742974051, - "precision": 0.6048625792811839, - "recall": 0.6278253236778583, - "support": 4557.0 + "f1-score": 0.5993816254416962, + "precision": 0.6593780369290574, + "recall": 0.5493927125506073, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.7920215150156881, - "precision": 0.8057455540355677, - "recall": 0.7787571617452622, - "support": 2269.0 + "f1-score": 0.8017817371937639, + "precision": 0.7197382769901853, + "recall": 0.9049360146252285, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8922796352583586, - "precision": 0.9209436566695947, - "recall": 0.865346067680698, - "support": 8481.0 + "f1-score": 0.9058997050147494, + "precision": 0.9337184554575859, + "recall": 0.8796906330564308, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8914289590611538, - "precision": 0.8790554552143957, - "recall": 0.9041557726709784, - "support": 14534.0 + "f1-score": 0.8854737486606459, + "precision": 0.862579028987236, + "recall": 0.9096169570413234, + "support": 15899.0 }, - "eval_accuracy": 0.8413927147213566, - "eval_loss": 0.443877637386322, + "eval_accuracy": 0.8468358208955223, + "eval_loss": 0.4562840759754181, "eval_macro avg": { - "f1-score": 0.7979650459081514, - "precision": 0.8026518113001855, - "recall": 0.7940210814436992, - "support": 29841.0 - }, - "eval_runtime": 4.8087, - "eval_samples_per_second": 16.637, - "eval_steps_per_second": 2.08, + "f1-score": 0.7981342040777137, + "precision": 0.7938534495910161, + "recall": 0.8109090793183975, + "support": 33500.0 + }, + "eval_runtime": 4.904, + "eval_samples_per_second": 16.517, + "eval_steps_per_second": 2.243, "eval_weighted avg": { - "f1-score": 0.842071433389123, - "precision": 0.8435143116581857, - "recall": 0.8413927147213566, - "support": 29841.0 + "f1-score": 0.8442053257085675, + "precision": 0.8455251408465503, + "recall": 0.8468358208955223, + "support": 33500.0 }, "step": 162 }, { "epoch": 3.0, "eval_Claim": { - "f1-score": 0.6042799305957202, - "precision": 0.6389432485322897, - "recall": 0.5731841123546193, - "support": 4557.0 + "f1-score": 0.6235462150581514, + "precision": 0.6285479226655697, + "recall": 0.6186234817813765, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8349557522123894, - "precision": 0.8382940915148823, - "recall": 0.8316438959894227, - "support": 2269.0 + "f1-score": 0.8338848444738584, + "precision": 0.8059701492537313, + "recall": 0.8638025594149908, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8941106484235574, - "precision": 0.9022691799735862, - "recall": 0.8860983374602052, - "support": 8481.0 + "f1-score": 0.9066250826953974, + "precision": 0.8974646833193002, + "recall": 0.9159744103886184, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8917763490086511, - "precision": 0.8729980887102089, - "recall": 0.9113802119168846, - "support": 14534.0 + "f1-score": 0.8827730692315017, + "precision": 0.8911176621379133, + "recall": 0.8745833071262343, + "support": 15899.0 }, - "eval_accuracy": 0.8464863778023525, - "eval_loss": 0.4555923044681549, + "eval_accuracy": 0.8490746268656716, + "eval_loss": 0.43820467591285706, "eval_macro avg": { - "f1-score": 0.8062806700600795, - "precision": 0.8131261521827418, - "recall": 0.8005766394302829, - "support": 29841.0 - }, - "eval_runtime": 4.7811, - "eval_samples_per_second": 16.733, - "eval_steps_per_second": 2.092, + "f1-score": 0.8117073028647273, + "precision": 0.8057751043441286, + "recall": 0.818245939677805, + "support": 33500.0 + }, + "eval_runtime": 4.9179, + "eval_samples_per_second": 16.47, + "eval_steps_per_second": 2.237, "eval_weighted avg": { - "f1-score": 0.8442159482345275, - "precision": 0.8429359878649869, - "recall": 0.8464863778023525, - "support": 29841.0 + "f1-score": 0.8488105033097496, + "precision": 0.8488213959184715, + "recall": 0.8490746268656716, + "support": 33500.0 }, "step": 243 }, { "epoch": 4.0, "eval_Claim": { - "f1-score": 0.6278026905829596, - "precision": 0.5981717011128775, - "recall": 0.6605222734254992, - "support": 4557.0 + "f1-score": 0.6415287144900879, + "precision": 0.6477507222451506, + "recall": 0.6354251012145749, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8182207014542344, - "precision": 0.7947652679684254, - "recall": 0.8431026884089907, - "support": 2269.0 + "f1-score": 0.8005126014523707, + "precision": 0.7514033680834001, + "recall": 0.856489945155393, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9069328626209752, - "precision": 0.9373427277302466, - "recall": 0.8784341469166372, - "support": 8481.0 + "f1-score": 0.9065169636319258, + "precision": 0.9273871354374751, + "recall": 0.8865654540246348, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.888919552918449, - "precision": 0.8913795489137954, - "recall": 0.8864730975643319, - "support": 14534.0 + "f1-score": 0.8932505382719131, + "precision": 0.8863636363636364, + "recall": 0.9002452984464432, + "support": 15899.0 }, - "eval_accuracy": 0.8463858449783854, - "eval_loss": 0.4377317428588867, + "eval_accuracy": 0.8540597014925373, + "eval_loss": 0.4749625325202942, "eval_macro avg": { - "f1-score": 0.8104689518941546, - "precision": 0.8054148114313363, - "recall": 0.8171330515788647, - "support": 29841.0 - }, - "eval_runtime": 4.8109, - "eval_samples_per_second": 16.629, - "eval_steps_per_second": 2.079, + "f1-score": 0.8104522044615743, + "precision": 0.8032262155324155, + "recall": 0.8196814497102615, + "support": 33500.0 + }, + "eval_runtime": 4.8972, + "eval_samples_per_second": 16.54, + "eval_steps_per_second": 2.246, "eval_weighted avg": { - "f1-score": 0.8487883791626096, - "precision": 0.8523207959781866, - "recall": 0.8463858449783854, - "support": 29841.0 + "f1-score": 0.8542213698406307, + "precision": 0.8551874645146165, + "recall": 0.8540597014925373, + "support": 33500.0 }, "step": 324 }, { "epoch": 5.0, "eval_Claim": { - "f1-score": 0.6247990569070839, - "precision": 0.6105990783410138, - "recall": 0.6396752249286811, - "support": 4557.0 + "f1-score": 0.6099687080911935, + "precision": 0.6808882235528942, + "recall": 0.5524291497975709, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.7998289136013687, - "precision": 0.7769007062733694, - "recall": 0.8241516086381666, - "support": 2269.0 + "f1-score": 0.8315018315018317, + "precision": 0.8330275229357799, + "recall": 0.829981718464351, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9028039585296891, - "precision": 0.9020600353148911, - "recall": 0.9035491097747907, - "support": 8481.0 + "f1-score": 0.9103454839630722, + "precision": 0.9074091642159188, + "recall": 0.9133008689009835, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8885327014878567, - "precision": 0.9001058948111542, - "recall": 0.8772533370028898, - "support": 14534.0 + "f1-score": 0.8913988368533824, + "precision": 0.8682249120505635, + "recall": 0.915843763758727, + "support": 15899.0 }, - "eval_accuracy": 0.8444086994403672, - "eval_loss": 0.5236712694168091, + "eval_accuracy": 0.8558507462686568, + "eval_loss": 0.5162495374679565, "eval_macro avg": { - "f1-score": 0.8039911576314996, - "precision": 0.7974164286851071, - "recall": 0.8111573200861321, - "support": 29841.0 - }, - "eval_runtime": 4.8153, - "eval_samples_per_second": 16.614, - "eval_steps_per_second": 2.077, + "f1-score": 0.8108037151023699, + "precision": 0.8223874556887891, + "recall": 0.8028888752304081, + "support": 33500.0 + }, + "eval_runtime": 4.9413, + "eval_samples_per_second": 16.392, + "eval_steps_per_second": 2.226, "eval_weighted avg": { - "f1-score": 0.8455693764619782, - "precision": 0.8470828034323642, - "recall": 0.8444086994403672, - "support": 29841.0 + "f1-score": 0.8519095458499607, + "precision": 0.8505509283002989, + "recall": 0.8558507462686568, + "support": 33500.0 }, "step": 405 }, { "epoch": 6.0, "eval_Claim": { - "f1-score": 0.6166529266281945, - "precision": 0.5813095006800078, - "recall": 0.6565723063418916, - "support": 4557.0 + "f1-score": 0.646279703934554, + "precision": 0.6227477477477478, + "recall": 0.6716599190283401, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8074107959743824, - "precision": 0.8392772230147408, - "recall": 0.7778757161745262, - "support": 2269.0 + "f1-score": 0.8414067684140676, + "precision": 0.8152593227603944, + "recall": 0.8692870201096892, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8913107165875667, - "precision": 0.8858607034707664, - "recall": 0.8968282042212004, - "support": 8481.0 + "f1-score": 0.9112506693929215, + "precision": 0.9295788637266588, + "recall": 0.8936312422419556, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8815305371596762, - "precision": 0.8981792217065334, - "recall": 0.865487821659557, - "support": 14534.0 + "f1-score": 0.8861383012314494, + "precision": 0.8897343224906474, + "recall": 0.8825712308950249, + "support": 15899.0 }, - "eval_accuracy": 0.8358298984618477, - "eval_loss": 0.5537309050559998, + "eval_accuracy": 0.8540597014925373, + "eval_loss": 0.552895724773407, "eval_macro avg": { - "f1-score": 0.7992262440874549, - "precision": 0.8011566622180121, - "recall": 0.7991910120992938, - "support": 29841.0 - }, - "eval_runtime": 4.7996, - "eval_samples_per_second": 16.668, - "eval_steps_per_second": 2.084, + "f1-score": 0.8212688607432481, + "precision": 0.8143300641813621, + "recall": 0.8292873530687525, + "support": 33500.0 + }, + "eval_runtime": 4.9336, + "eval_samples_per_second": 16.418, + "eval_steps_per_second": 2.23, "eval_weighted avg": { - "f1-score": 0.838225042631562, - "precision": 0.8418105575563007, - "recall": 0.8358298984618477, - "support": 29841.0 + "f1-score": 0.8556973390614198, + "precision": 0.8579560210496036, + "recall": 0.8540597014925373, + "support": 33500.0 }, "step": 486 }, { "epoch": 6.17, - "grad_norm": 6.804128646850586, + "grad_norm": 9.790245056152344, "learning_rate": 1.7530864197530865e-05, - "loss": 0.3426, + "loss": 0.3328, "step": 500 }, { "epoch": 7.0, "eval_Claim": { - "f1-score": 0.6206536493682782, - "precision": 0.5920318725099601, - "recall": 0.652183454026772, - "support": 4557.0 + "f1-score": 0.6202600808654791, + "precision": 0.6739491807171694, + "recall": 0.5744939271255061, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8364370652905541, - "precision": 0.8519195612431444, - "recall": 0.8215072719259586, - "support": 2269.0 + "f1-score": 0.8670041417395307, + "precision": 0.8730305838739574, + "recall": 0.8610603290676416, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9008658773634918, - "precision": 0.9000706214689266, - "recall": 0.9016625397948355, - "support": 8481.0 + "f1-score": 0.9109892729439809, + "precision": 0.9097314797181489, + "recall": 0.9122505490308412, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8854242963272995, - "precision": 0.8978566881233642, - "recall": 0.8733314985551122, - "support": 14534.0 + "f1-score": 0.8872356123954747, + "precision": 0.8677611401767996, + "recall": 0.9076042518397384, + "support": 15899.0 }, - "eval_accuracy": 0.8436714587312758, - "eval_loss": 0.5738794207572937, + "eval_accuracy": 0.8568955223880597, + "eval_loss": 0.5894299149513245, "eval_macro avg": { - "f1-score": 0.8108452220874058, - "precision": 0.8104696858363488, - "recall": 0.8121711910756696, - "support": 29841.0 - }, - "eval_runtime": 4.8167, - "eval_samples_per_second": 16.609, - "eval_steps_per_second": 2.076, + "f1-score": 0.8213722769861164, + "precision": 0.8311180961215189, + "recall": 0.8138522642659318, + "support": 33500.0 + }, + "eval_runtime": 4.9037, + "eval_samples_per_second": 16.518, + "eval_steps_per_second": 2.243, "eval_weighted avg": { - "f1-score": 0.8456551258354699, - "precision": 0.8482906998207675, - "recall": 0.8436714587312758, - "support": 29841.0 + "f1-score": 0.8539713289140156, + "precision": 0.8526463291050193, + "recall": 0.8568955223880597, + "support": 33500.0 }, "step": 567 }, { "epoch": 8.0, "eval_Claim": { - "f1-score": 0.6410105757931845, - "precision": 0.5787798408488064, - "recall": 0.7182356813693219, - "support": 4557.0 + "f1-score": 0.6441500279902966, + "precision": 0.5974385600553825, + "recall": 0.6987854251012146, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8115942028985507, - "precision": 0.8804123711340206, - "recall": 0.75275451740855, - "support": 2269.0 + "f1-score": 0.834510811389424, + "precision": 0.7849375755134917, + "recall": 0.8907678244972578, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8960937967338637, - "precision": 0.9094220495386109, - "recall": 0.8831505718665251, - "support": 8481.0 + "f1-score": 0.9059161060546101, + "precision": 0.9398542543364466, + "recall": 0.874343550081161, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.891816143497758, - "precision": 0.9084939329050679, - "recall": 0.8757396449704142, - "support": 14534.0 + "f1-score": 0.8801401497053671, + "precision": 0.8915849251419721, + "recall": 0.8689854707843261, + "support": 15899.0 }, - "eval_accuracy": 0.8444422103816897, - "eval_loss": 0.5891872644424438, + "eval_accuracy": 0.8469850746268657, + "eval_loss": 0.5878348350524902, "eval_macro avg": { - "f1-score": 0.8101286797308392, - "precision": 0.8192770486066265, - "recall": 0.8074701039037029, - "support": 29841.0 - }, - "eval_runtime": 4.799, - "eval_samples_per_second": 16.67, - "eval_steps_per_second": 2.084, + "f1-score": 0.8161792737849245, + "precision": 0.8034538287618231, + "recall": 0.8332205676159898, + "support": 33500.0 + }, + "eval_runtime": 4.9086, + "eval_samples_per_second": 16.502, + "eval_steps_per_second": 2.241, "eval_weighted avg": { - "f1-score": 0.8486317402219317, - "precision": 0.8562720628608399, - "recall": 0.8444422103816897, - "support": 29841.0 + "f1-score": 0.8504184600736624, + "precision": 0.8563340964894008, + "recall": 0.8469850746268657, + "support": 33500.0 }, "step": 648 }, { "epoch": 9.0, "eval_Claim": { - "f1-score": 0.6284997910572503, - "precision": 0.5998005982053839, - "recall": 0.6600833881939873, - "support": 4557.0 + "f1-score": 0.6323094193285029, + "precision": 0.6375797489195307, + "recall": 0.6271255060728745, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.816712834718375, - "precision": 0.857489093553078, - "recall": 0.7796386073159982, - "support": 2269.0 + "f1-score": 0.8525914292124747, + "precision": 0.8373732921992068, + "recall": 0.8683729433272395, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8971996170416466, - "precision": 0.9108249301421455, - "recall": 0.8839759462327555, - "support": 8481.0 + "f1-score": 0.9054132151801194, + "precision": 0.9134194927606647, + "recall": 0.8975460708488494, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8942406935938898, - "precision": 0.8943022295623452, - "recall": 0.8941791660932985, - "support": 14534.0 + "f1-score": 0.8888055034396498, + "precision": 0.883775884584292, + "recall": 0.8938926976539405, + "support": 15899.0 }, - "eval_accuracy": 0.8468214872155759, - "eval_loss": 0.7009620070457458, + "eval_accuracy": 0.8540298507462687, + "eval_loss": 0.7043101191520691, "eval_macro avg": { - "f1-score": 0.8091632341027905, - "precision": 0.8156042128657381, - "recall": 0.8044692769590099, - "support": 29841.0 - }, - "eval_runtime": 4.8005, - "eval_samples_per_second": 16.665, - "eval_steps_per_second": 2.083, + "f1-score": 0.8197798917901866, + "precision": 0.8180371046159236, + "recall": 0.821734304475726, + "support": 33500.0 + }, + "eval_runtime": 4.935, + "eval_samples_per_second": 16.414, + "eval_steps_per_second": 2.229, "eval_weighted avg": { - "f1-score": 0.848605581671113, - "precision": 0.8512257939173797, - "recall": 0.8468214872155759, - "support": 29841.0 + "f1-score": 0.853808653145316, + "precision": 0.8537078167069386, + "recall": 0.8540298507462687, + "support": 33500.0 }, "step": 729 }, { "epoch": 10.0, "eval_Claim": { - "f1-score": 0.6189745836985101, - "precision": 0.6180266900021877, - "recall": 0.619925389510643, - "support": 4557.0 + "f1-score": 0.6347110795166041, + "precision": 0.6368453230079478, + "recall": 0.6325910931174089, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8208921766420085, - "precision": 0.8353102189781022, - "recall": 0.8069634200088145, - "support": 2269.0 + "f1-score": 0.8442090055381651, + "precision": 0.8921119592875318, + "recall": 0.8011882998171846, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8951902368987796, - "precision": 0.9085610200364299, - "recall": 0.8822072868765476, - "support": 8481.0 + "f1-score": 0.9106677408653618, + "precision": 0.9040270982310877, + "recall": 0.9174066647569942, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8963474827245805, - "precision": 0.8870174493027017, - "recall": 0.905875877253337, - "support": 14534.0 + "f1-score": 0.8841656478259506, + "precision": 0.881375, + "recall": 0.8869740235234921, + "support": 15899.0 }, - "eval_accuracy": 0.8479608592205355, - "eval_loss": 0.7416248917579651, + "eval_accuracy": 0.8533731343283583, + "eval_loss": 0.7164433002471924, "eval_macro avg": { - "f1-score": 0.8078511199909697, - "precision": 0.8122288445798553, - "recall": 0.8037429934123356, - "support": 29841.0 - }, - "eval_runtime": 4.7804, - "eval_samples_per_second": 16.735, - "eval_steps_per_second": 2.092, + "f1-score": 0.8184383684365204, + "precision": 0.8285898451316418, + "recall": 0.8095400203037699, + "support": 33500.0 + }, + "eval_runtime": 4.9093, + "eval_samples_per_second": 16.499, + "eval_steps_per_second": 2.241, "eval_weighted avg": { - "f1-score": 0.8479238041544329, - "precision": 0.8481312332795722, - "recall": 0.8479608592205355, - "support": 29841.0 + "f1-score": 0.8530559678148433, + "precision": 0.8530989190255094, + "recall": 0.8533731343283583, + "support": 33500.0 }, "step": 810 }, { "epoch": 11.0, "eval_Claim": { - "f1-score": 0.6350413962855225, - "precision": 0.6477973065510158, - "recall": 0.6227781435154707, - "support": 4557.0 + "f1-score": 0.645658668208538, + "precision": 0.6161486113665624, + "recall": 0.6781376518218624, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8403837767117314, - "precision": 0.8316788951230039, - "recall": 0.8492728074041428, - "support": 2269.0 + "f1-score": 0.8331177231565331, + "precision": 0.7885714285714286, + "recall": 0.8829981718464351, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9076665470637484, - "precision": 0.920883387938357, - "recall": 0.894823723617498, - "support": 8481.0 + "f1-score": 0.9059711059612445, + "precision": 0.9366843393148451, + "recall": 0.8772080588179128, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9016170675363501, - "precision": 0.8904844987250033, - "recall": 0.9130315123159488, - "support": 14534.0 + "f1-score": 0.8902977542265961, + "precision": 0.8929452704840241, + "recall": 0.8876658909365369, + "support": 15899.0 }, - "eval_accuracy": 0.8586843604436849, - "eval_loss": 0.753268837928772, + "eval_accuracy": 0.8531940298507462, + "eval_loss": 0.7852362394332886, "eval_macro avg": { - "f1-score": 0.8211771968993381, - "precision": 0.822711022084345, - "recall": 0.8199765467132651, - "support": 29841.0 - }, - "eval_runtime": 4.7829, - "eval_samples_per_second": 16.726, - "eval_steps_per_second": 2.091, + "f1-score": 0.818761312888228, + "precision": 0.8085874124342151, + "recall": 0.8315024433556868, + "support": 33500.0 + }, + "eval_runtime": 4.89, + "eval_samples_per_second": 16.565, + "eval_steps_per_second": 2.25, "eval_weighted avg": { - "f1-score": 0.8579718131916827, - "precision": 0.8575920866110881, - "recall": 0.8586843604436849, - "support": 29841.0 + "f1-score": 0.8553879040715653, + "precision": 0.8589850855801485, + "recall": 0.8531940298507462, + "support": 33500.0 }, "step": 891 }, { "epoch": 12.0, "eval_Claim": { - "f1-score": 0.6230640668523677, - "precision": 0.6328655500226347, - "recall": 0.6135615536537196, - "support": 4557.0 + "f1-score": 0.6329215627196947, + "precision": 0.6280645804265498, + "recall": 0.6378542510121458, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.837270341207349, - "precision": 0.8310898827616153, - "recall": 0.8435434111943587, - "support": 2269.0 + "f1-score": 0.8528368794326241, + "precision": 0.8278829604130808, + "recall": 0.8793418647166362, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8982022214588343, - "precision": 0.8730105731775181, - "recall": 0.9248909326730338, - "support": 8481.0 + "f1-score": 0.9126755145220234, + "precision": 0.9193064031773709, + "recall": 0.9061395970591044, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8888346297394397, - "precision": 0.9013795542978422, - "recall": 0.8766340993532407, - "support": 14534.0 + "f1-score": 0.8876634630534112, + "precision": 0.8894291487749432, + "recall": 0.88590477388515, + "support": 15899.0 }, - "eval_accuracy": 0.8476592607486344, - "eval_loss": 0.8125314712524414, + "eval_accuracy": 0.8552238805970149, + "eval_loss": 0.8324545621871948, "eval_macro avg": { - "f1-score": 0.8118428148144977, - "precision": 0.8095863900649026, - "recall": 0.8146574992185882, - "support": 29841.0 - }, - "eval_runtime": 4.7824, - "eval_samples_per_second": 16.728, - "eval_steps_per_second": 2.091, + "f1-score": 0.8215243549319383, + "precision": 0.8161707731979861, + "recall": 0.827310121668259, + "support": 33500.0 + }, + "eval_runtime": 4.8939, + "eval_samples_per_second": 16.551, + "eval_steps_per_second": 2.248, "eval_weighted avg": { - "f1-score": 0.846990546753497, - "precision": 0.8469677413197487, - "recall": 0.8476592607486344, - "support": 29841.0 + "f1-score": 0.8556433335734092, + "precision": 0.8562082669116539, + "recall": 0.8552238805970149, + "support": 33500.0 }, "step": 972 }, { "epoch": 12.35, - "grad_norm": 15.335172653198242, + "grad_norm": 2.6090729236602783, "learning_rate": 1.506172839506173e-05, - "loss": 0.061, + "loss": 0.0589, "step": 1000 }, { "epoch": 13.0, "eval_Claim": { - "f1-score": 0.6158673240699238, - "precision": 0.6292649416075109, - "recall": 0.6030283080974326, - "support": 4557.0 + "f1-score": 0.6431152147731835, + "precision": 0.6377388535031847, + "recall": 0.648582995951417, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8147180492053124, - "precision": 0.8050774526678142, - "recall": 0.8245923314235346, - "support": 2269.0 + "f1-score": 0.8326953388876379, + "precision": 0.8206835330670218, + "recall": 0.8450639853747715, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9060346875742457, - "precision": 0.9128665469778575, - "recall": 0.8993043273198915, - "support": 8481.0 + "f1-score": 0.904438383337466, + "precision": 0.9408790755262072, + "recall": 0.8707151723479424, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9008830850011933, - "precision": 0.8929368029739777, - "recall": 0.9089720655015825, - "support": 14534.0 + "f1-score": 0.892013567684243, + "precision": 0.8749621922448733, + "recall": 0.9097427511164224, + "support": 15899.0 }, - "eval_accuracy": 0.8530880332428538, - "eval_loss": 0.8537381887435913, + "eval_accuracy": 0.8548059701492537, + "eval_loss": 0.8543176651000977, "eval_macro avg": { - "f1-score": 0.8093757864626687, - "precision": 0.8100364360567901, - "recall": 0.8089742580856103, - "support": 29841.0 - }, - "eval_runtime": 4.7933, - "eval_samples_per_second": 16.69, - "eval_steps_per_second": 2.086, + "f1-score": 0.8180656261706326, + "precision": 0.8185659135853218, + "recall": 0.8185262261976383, + "support": 33500.0 + }, + "eval_runtime": 4.9338, + "eval_samples_per_second": 16.417, + "eval_steps_per_second": 2.23, "eval_weighted avg": { - "f1-score": 0.8522709558043637, - "precision": 0.8516552983596964, - "recall": 0.8530880332428538, - "support": 29841.0 + "f1-score": 0.8553204019036041, + "precision": 0.8570428644520474, + "recall": 0.8548059701492537, + "support": 33500.0 }, "step": 1053 }, { "epoch": 14.0, "eval_Claim": { - "f1-score": 0.6346033728919426, - "precision": 0.6036838978015449, - "recall": 0.6688610928242265, - "support": 4557.0 + "f1-score": 0.6541843971631205, + "precision": 0.6138420585625555, + "recall": 0.7002024291497976, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8067737733391228, - "precision": 0.7950363714163458, - "recall": 0.8188629352137505, - "support": 2269.0 + "f1-score": 0.8336528221512247, + "precision": 0.7806142800159553, + "recall": 0.8944241316270567, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9004597838418822, - "precision": 0.9121703363174449, - "recall": 0.8890461030538852, - "support": 8481.0 + "f1-score": 0.9079845651528643, + "precision": 0.9421004003695719, + "recall": 0.8762532225723288, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8921770010096438, - "precision": 0.903023468884347, - "recall": 0.8815880005504335, - "support": 14534.0 + "f1-score": 0.889389516436096, + "precision": 0.8974194787731319, + "recall": 0.8815019812566828, + "support": 15899.0 }, - "eval_accuracy": 0.8464528668610302, - "eval_loss": 0.9449928998947144, + "eval_accuracy": 0.8539701492537314, + "eval_loss": 0.9095103144645691, "eval_macro avg": { - "f1-score": 0.8085034827706478, - "precision": 0.8034785186049206, - "recall": 0.8145895329105739, - "support": 29841.0 - }, - "eval_runtime": 4.8154, - "eval_samples_per_second": 16.613, - "eval_steps_per_second": 2.077, + "f1-score": 0.8213028252258264, + "precision": 0.8084940544303038, + "recall": 0.8380954411514664, + "support": 33500.0 + }, + "eval_runtime": 4.8917, + "eval_samples_per_second": 16.559, + "eval_steps_per_second": 2.249, "eval_weighted avg": { - "f1-score": 0.8487033685671466, - "precision": 0.8517001698367573, - "recall": 0.8464528668610302, - "support": 29841.0 + "f1-score": 0.8568784946124219, + "precision": 0.8619418985092084, + "recall": 0.8539701492537314, + "support": 33500.0 }, "step": 1134 }, { "epoch": 15.0, "eval_Claim": { - "f1-score": 0.6062717770034843, - "precision": 0.5687367813881946, - "recall": 0.6491112574061882, - "support": 4557.0 + "f1-score": 0.631984585741811, + "precision": 0.6332046332046332, + "recall": 0.6307692307692307, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8176843948347561, - "precision": 0.8121739130434783, - "recall": 0.8232701630674306, - "support": 2269.0 + "f1-score": 0.8264781491002571, + "precision": 0.7778225806451613, + "recall": 0.8816270566727605, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8942823803967327, - "precision": 0.8850906571197598, - "recall": 0.9036670203985379, - "support": 8481.0 + "f1-score": 0.8970963775654971, + "precision": 0.8886910896655111, + "recall": 0.9056621789363124, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.877618288144604, - "precision": 0.9049777063080184, - "recall": 0.8518645933672767, - "support": 14534.0 + "f1-score": 0.8838946528332003, + "precision": 0.8974458706080644, + "recall": 0.8707465878357129, + "support": 15899.0 }, - "eval_accuracy": 0.8334506216279616, - "eval_loss": 1.0531803369522095, + "eval_accuracy": 0.8469850746268657, + "eval_loss": 0.9576827883720398, "eval_macro avg": { - "f1-score": 0.7989642100948944, - "precision": 0.7927447644648628, - "recall": 0.8069782585598584, - "support": 29841.0 - }, - "eval_runtime": 4.774, - "eval_samples_per_second": 16.757, - "eval_steps_per_second": 2.095, + "f1-score": 0.8098634413101913, + "precision": 0.7992910435308425, + "recall": 0.8222012635535042, + "support": 33500.0 + }, + "eval_runtime": 4.8883, + "eval_samples_per_second": 16.57, + "eval_steps_per_second": 2.25, "eval_weighted avg": { - "f1-score": 0.8363600230462553, - "precision": 0.8409220859889104, - "recall": 0.8334506216279616, - "support": 29841.0 + "f1-score": 0.8471244624308779, + "precision": 0.8479301603984184, + "recall": 0.8469850746268657, + "support": 33500.0 }, "step": 1215 }, { "epoch": 16.0, "eval_Claim": { - "f1-score": 0.6349479110729246, - "precision": 0.6217921750105174, - "recall": 0.6486723721746763, - "support": 4557.0 + "f1-score": 0.6332942805410586, + "precision": 0.6682400539447066, + "recall": 0.6018218623481781, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8260292164674634, - "precision": 0.8297020898176968, - "recall": 0.8223887174966946, - "support": 2269.0 + "f1-score": 0.8478211270819075, + "precision": 0.8464692482915718, + "recall": 0.8491773308957953, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9045516104339634, - "precision": 0.9034344860032933, - "recall": 0.9056715010022403, - "support": 8481.0 + "f1-score": 0.9089773764349872, + "precision": 0.9145563502803016, + "recall": 0.9034660555714695, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8956702459300312, - "precision": 0.90185546875, - "recall": 0.8895692858125774, - "support": 14534.0 + "f1-score": 0.8924681415656145, + "precision": 0.8759539672925499, + "recall": 0.9096169570413234, + "support": 15899.0 }, - "eval_accuracy": 0.8522502597097953, - "eval_loss": 0.9694080352783203, + "eval_accuracy": 0.8583582089552239, + "eval_loss": 0.9394893646240234, "eval_macro avg": { - "f1-score": 0.8152997459760956, - "precision": 0.8141960548953769, - "recall": 0.8165754691215471, - "support": 29841.0 - }, - "eval_runtime": 4.7829, - "eval_samples_per_second": 16.726, - "eval_steps_per_second": 2.091, + "f1-score": 0.8206402314058919, + "precision": 0.8263049049522826, + "recall": 0.8160205514641916, + "support": 33500.0 + }, + "eval_runtime": 4.896, + "eval_samples_per_second": 16.544, + "eval_steps_per_second": 2.247, "eval_weighted avg": { - "f1-score": 0.8530843968151707, - "precision": 0.854049671322198, - "recall": 0.8522502597097953, - "support": 29841.0 + "f1-score": 0.8564948483009961, + "precision": 0.8554663093796615, + "recall": 0.8583582089552239, + "support": 33500.0 }, "step": 1296 }, { "epoch": 17.0, "eval_Claim": { - "f1-score": 0.6241452751933639, - "precision": 0.6379468377635197, - "recall": 0.6109282422646478, - "support": 4557.0 + "f1-score": 0.6431561322729175, + "precision": 0.6657279029462738, + "recall": 0.6220647773279352, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8151592652871426, - "precision": 0.8626968503937008, - "recall": 0.7725870427501101, - "support": 2269.0 + "f1-score": 0.8454073572556984, + "precision": 0.8350423539901917, + "recall": 0.8560329067641682, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9064921025764218, - "precision": 0.9237454100367197, - "recall": 0.8898714774201155, - "support": 8481.0 + "f1-score": 0.909496556407023, + "precision": 0.9241991128634796, + "recall": 0.8952544638594481, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8993928008319636, - "precision": 0.8775777414075286, - "recall": 0.9223200770606853, - "support": 14534.0 + "f1-score": 0.8953850902917116, + "precision": 0.8791828322017459, + "recall": 0.9121957355808541, + "support": 15899.0 }, - "eval_accuracy": 0.8541603833651688, - "eval_loss": 0.985948920249939, + "eval_accuracy": 0.8604477611940299, + "eval_loss": 0.9581068754196167, "eval_macro avg": { - "f1-score": 0.8112973609722229, - "precision": 0.8254917099003672, - "recall": 0.7989267098738898, - "support": 29841.0 - }, - "eval_runtime": 4.7769, - "eval_samples_per_second": 16.747, - "eval_steps_per_second": 2.093, + "f1-score": 0.8233612840568376, + "precision": 0.8260380505004228, + "recall": 0.8213869708831014, + "support": 33500.0 + }, + "eval_runtime": 4.8973, + "eval_samples_per_second": 16.54, + "eval_steps_per_second": 2.246, "eval_weighted avg": { - "f1-score": 0.8529727851357218, - "precision": 0.85297351326598, - "recall": 0.8541603833651688, - "support": 29841.0 + "f1-score": 0.859338136623951, + "precision": 0.8588965274411914, + "recall": 0.8604477611940299, + "support": 33500.0 }, "step": 1377 }, { "epoch": 18.0, "eval_Claim": { - "f1-score": 0.638718890248878, - "precision": 0.5967219363445778, - "recall": 0.6870748299319728, - "support": 4557.0 + "f1-score": 0.6493941483597675, + "precision": 0.632508155824218, + "recall": 0.6672064777327935, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.778357854769815, - "precision": 0.8431876606683805, - "recall": 0.7227853680035258, - "support": 2269.0 + "f1-score": 0.8654810761513908, + "precision": 0.8635122838944495, + "recall": 0.8674588665447898, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9013165698019214, - "precision": 0.9066937119675457, - "recall": 0.8960028298549699, - "support": 8481.0 + "f1-score": 0.9125304729400293, + "precision": 0.9323503038756601, + "recall": 0.8935357586173971, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8934796194708702, - "precision": 0.9018082422203533, - "recall": 0.885303426448328, - "support": 14534.0 + "f1-score": 0.8928739085531874, + "precision": 0.8885635978572318, + "recall": 0.8972262406440656, + "support": 15899.0 }, - "eval_accuracy": 0.8457156261519386, - "eval_loss": 0.9986578822135925, + "eval_accuracy": 0.8602089552238806, + "eval_loss": 0.9848275184631348, "eval_macro avg": { - "f1-score": 0.8029682335728712, - "precision": 0.8121028878002143, - "recall": 0.7977916135596992, - "support": 29841.0 - }, - "eval_runtime": 4.7848, - "eval_samples_per_second": 16.719, - "eval_steps_per_second": 2.09, + "f1-score": 0.8300699015010937, + "precision": 0.8292335853628898, + "recall": 0.8313568358847614, + "support": 33500.0 + }, + "eval_runtime": 4.9301, + "eval_samples_per_second": 16.43, + "eval_steps_per_second": 2.231, "eval_weighted avg": { - "f1-score": 0.8480491462490054, - "precision": 0.8521498954326654, - "recall": 0.8457156261519386, - "support": 29841.0 + "f1-score": 0.8613257791852104, + "precision": 0.8628576878135704, + "recall": 0.8602089552238806, + "support": 33500.0 }, "step": 1458 }, { "epoch": 18.52, - "grad_norm": 11.437110900878906, + "grad_norm": 1.7008241415023804, "learning_rate": 1.2592592592592593e-05, - "loss": 0.0189, + "loss": 0.0216, "step": 1500 }, { "epoch": 19.0, "eval_Claim": { - "f1-score": 0.6127094530509011, - "precision": 0.5894160583941606, - "recall": 0.6379196840026333, - "support": 4557.0 + "f1-score": 0.6404391582799633, + "precision": 0.6432509699816213, + "recall": 0.6376518218623481, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.800753453327752, - "precision": 0.762455161418892, - "recall": 0.8431026884089907, - "support": 2269.0 + "f1-score": 0.8286799195890104, + "precision": 0.8103975535168195, + "recall": 0.8478062157221207, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8959336706699994, - "precision": 0.9275435496086847, - "recall": 0.8664072632944229, - "support": 8481.0 + "f1-score": 0.9006844397645144, + "precision": 0.9029750479846449, + "recall": 0.898405423469875, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8912863642630635, - "precision": 0.8930100842657825, - "recall": 0.8895692858125774, - "support": 14534.0 + "f1-score": 0.8906363035888403, + "precision": 0.8907763936076507, + "recall": 0.8904962576262658, + "support": 15899.0 }, - "eval_accuracy": 0.8410240943668108, - "eval_loss": 1.0641764402389526, + "eval_accuracy": 0.8528955223880597, + "eval_loss": 1.0161080360412598, "eval_macro avg": { - "f1-score": 0.800170735327929, - "precision": 0.79310621342188, - "recall": 0.8092497303796561, - "support": 29841.0 - }, - "eval_runtime": 4.8048, - "eval_samples_per_second": 16.65, - "eval_steps_per_second": 2.081, + "f1-score": 0.8151099553055821, + "precision": 0.8118499912726841, + "recall": 0.8185899296701524, + "support": 33500.0 + }, + "eval_runtime": 4.8924, + "eval_samples_per_second": 16.556, + "eval_steps_per_second": 2.248, "eval_weighted avg": { - "f1-score": 0.8431820663618932, - "precision": 0.8465361465202841, - "recall": 0.8410240943668108, - "support": 29841.0 + "f1-score": 0.8528362935634777, + "precision": 0.8528394387556787, + "recall": 0.8528955223880597, + "support": 33500.0 }, "step": 1539 }, { "epoch": 20.0, "eval_Claim": { - "f1-score": 0.6346276257161044, - "precision": 0.6142945163277881, - "recall": 0.6563528637261357, - "support": 4557.0 + "f1-score": 0.650995688770273, + "precision": 0.6603498542274052, + "recall": 0.6419028340080971, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8171902268760908, - "precision": 0.8090712742980561, - "recall": 0.8254737769942706, - "support": 2269.0 + "f1-score": 0.8586199145875477, + "precision": 0.8447589562140646, + "recall": 0.8729433272394881, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9044396961063628, - "precision": 0.9106011712680769, - "recall": 0.8983610423299139, - "support": 8481.0 + "f1-score": 0.9104241552839684, + "precision": 0.913972286374134, + "recall": 0.9069034660555715, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.894879267277269, - "precision": 0.902519244226732, - "recall": 0.8873675519471584, - "support": 14534.0 + "f1-score": 0.8906836964688204, + "precision": 0.8866313493300093, + "recall": 0.894773256179634, + "support": 15899.0 }, - "eval_accuracy": 0.8505076907610335, - "eval_loss": 1.087249994277954, + "eval_accuracy": 0.8598507462686568, + "eval_loss": 0.9872655272483826, "eval_macro avg": { - "f1-score": 0.8127842039939568, - "precision": 0.8091215515301633, - "recall": 0.8168888087493696, - "support": 29841.0 - }, - "eval_runtime": 4.7799, - "eval_samples_per_second": 16.737, - "eval_steps_per_second": 2.092, + "f1-score": 0.8276808637776524, + "precision": 0.8264281115364033, + "recall": 0.8291307208706977, + "support": 33500.0 + }, + "eval_runtime": 4.9351, + "eval_samples_per_second": 16.413, + "eval_steps_per_second": 2.229, "eval_weighted avg": { - "f1-score": 0.85194635060675, - "precision": 0.8536961248417916, - "recall": 0.8505076907610335, - "support": 29841.0 + "f1-score": 0.8594158610175964, + "precision": 0.8590759538589217, + "recall": 0.8598507462686568, + "support": 33500.0 }, "step": 1620 }, { "epoch": 21.0, "eval_Claim": { - "f1-score": 0.6397356640375187, - "precision": 0.6219689119170985, - "recall": 0.6585472898836954, - "support": 4557.0 + "f1-score": 0.6439562566534404, + "precision": 0.6169108103096607, + "recall": 0.6734817813765183, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8133363574506692, - "precision": 0.8378504672897197, - "recall": 0.7902159541648304, - "support": 2269.0 + "f1-score": 0.8524001794526693, + "precision": 0.8370044052863436, + "recall": 0.8683729433272395, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9003324267150197, - "precision": 0.9236111111111112, - "recall": 0.8781983256691428, - "support": 8481.0 + "f1-score": 0.9078541717641301, + "precision": 0.9311383256374222, + "recall": 0.8857061014036093, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8964765215020788, - "precision": 0.8880637321091007, - "recall": 0.9050502270538049, - "support": 14534.0 + "f1-score": 0.8851262038144394, + "precision": 0.8857952755905512, + "recall": 0.8844581420215107, + "support": 15899.0 }, - "eval_accuracy": 0.8510438658221909, - "eval_loss": 1.093902826309204, + "eval_accuracy": 0.8526865671641791, + "eval_loss": 1.0280390977859497, "eval_macro avg": { - "f1-score": 0.8124702424263215, - "precision": 0.8178735556067575, - "recall": 0.8080029491928683, - "support": 29841.0 - }, - "eval_runtime": 4.813, - "eval_samples_per_second": 16.622, - "eval_steps_per_second": 2.078, + "f1-score": 0.8223342029211698, + "precision": 0.8177122042059943, + "recall": 0.8280047420322194, + "support": 33500.0 + }, + "eval_runtime": 4.9316, + "eval_samples_per_second": 16.425, + "eval_steps_per_second": 2.231, "eval_weighted avg": { - "f1-score": 0.8520439894961911, - "precision": 0.8537133191814482, - "recall": 0.8510438658221909, - "support": 29841.0 + "f1-score": 0.8545305598758789, + "precision": 0.8571336063495862, + "recall": 0.8526865671641791, + "support": 33500.0 }, "step": 1701 }, { "epoch": 22.0, "eval_Claim": { - "f1-score": 0.6279694722132645, - "precision": 0.6154656552886641, - "recall": 0.640991880623217, - "support": 4557.0 + "f1-score": 0.6535234899328859, + "precision": 0.6779808529155787, + "recall": 0.6307692307692307, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8173439463762043, - "precision": 0.7788423153692615, - "recall": 0.8598501542529748, - "support": 2269.0 + "f1-score": 0.8511305126483099, + "precision": 0.8341377797279509, + "recall": 0.8688299817184644, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9038883941822499, - "precision": 0.910210425633668, - "recall": 0.8976535785874308, - "support": 8481.0 + "f1-score": 0.9092228079508632, + "precision": 0.9212073696589572, + "recall": 0.8975460708488494, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8954102920723226, - "precision": 0.9051033319274567, - "recall": 0.8859226640979772, - "support": 14534.0 + "f1-score": 0.8968440594059406, + "precision": 0.882589367273613, + "recall": 0.9115667652053588, + "support": 15899.0 }, - "eval_accuracy": 0.849870982875909, - "eval_loss": 1.0930607318878174, + "eval_accuracy": 0.8629850746268657, + "eval_loss": 1.0620397329330444, "eval_macro avg": { - "f1-score": 0.8111530262110103, - "precision": 0.8024054320547626, - "recall": 0.8211045693904, - "support": 29841.0 - }, - "eval_runtime": 4.8038, - "eval_samples_per_second": 16.654, - "eval_steps_per_second": 2.082, + "f1-score": 0.8276802174844999, + "precision": 0.828978842394025, + "recall": 0.8271780121354758, + "support": 33500.0 + }, + "eval_runtime": 4.8953, + "eval_samples_per_second": 16.546, + "eval_steps_per_second": 2.247, "eval_weighted avg": { - "f1-score": 0.8510432276144315, - "precision": 0.8527239921837771, - "recall": 0.849870982875909, - "support": 29841.0 + "f1-score": 0.8618475752270865, + "precision": 0.8613257315871389, + "recall": 0.8629850746268657, + "support": 33500.0 }, "step": 1782 }, { "epoch": 23.0, "eval_Claim": { - "f1-score": 0.6225736879942487, - "precision": 0.5851351351351352, - "recall": 0.6651305683563749, - "support": 4557.0 + "f1-score": 0.6436781609195402, + "precision": 0.5858518764530056, + "recall": 0.71417004048583, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8058810995099083, - "precision": 0.7801155115511551, - "recall": 0.8334067871308947, - "support": 2269.0 + "f1-score": 0.8615044247787611, + "precision": 0.8349056603773585, + "recall": 0.8898537477148081, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.8976647945610404, - "precision": 0.9001659947830211, - "recall": 0.8951774554887395, - "support": 8481.0 + "f1-score": 0.9092565073582283, + "precision": 0.9129765113592607, + "recall": 0.905566695311754, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8881674136288245, - "precision": 0.9116858653915816, - "recall": 0.8658318425760286, - "support": 14534.0 + "f1-score": 0.873210033597547, + "precision": 0.9069657135113159, + "recall": 0.841876847600478, + "support": 15899.0 }, - "eval_accuracy": 0.8410576053081331, - "eval_loss": 1.1820006370544434, + "eval_accuracy": 0.846089552238806, + "eval_loss": 1.189612627029419, "eval_macro avg": { - "f1-score": 0.8035717489235055, - "precision": 0.7942756267152233, - "recall": 0.8148866633880094, - "support": 29841.0 - }, - "eval_runtime": 4.7901, - "eval_samples_per_second": 16.701, - "eval_steps_per_second": 2.088, + "f1-score": 0.8219122816635192, + "precision": 0.8101749404252352, + "recall": 0.8378668327782175, + "support": 33500.0 + }, + "eval_runtime": 4.9275, + "eval_samples_per_second": 16.438, + "eval_steps_per_second": 2.232, "eval_weighted avg": { - "f1-score": 0.8440512323089471, - "precision": 0.8485403664715132, - "recall": 0.8410576053081331, - "support": 29841.0 + "f1-score": 0.8498672096145845, + "precision": 0.8567860518556853, + "recall": 0.846089552238806, + "support": 33500.0 }, "step": 1863 }, { "epoch": 24.0, "eval_Claim": { - "f1-score": 0.6244661044792466, - "precision": 0.6233056405771753, - "recall": 0.6256308975202984, - "support": 4557.0 + "f1-score": 0.6632010396880935, + "precision": 0.6551451708473237, + "recall": 0.6714574898785425, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8177083333333335, - "precision": 0.8054724241128688, - "recall": 0.8303217276333187, - "support": 2269.0 + "f1-score": 0.84557309540151, + "precision": 0.8465414567109483, + "recall": 0.8446069469835467, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9007499414108273, - "precision": 0.8951904040992198, - "recall": 0.9063789647447235, - "support": 8481.0 + "f1-score": 0.911568570600174, + "precision": 0.922805987672439, + "recall": 0.9006015468347178, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8948225108225109, - "precision": 0.9008437347465309, - "recall": 0.888881243979634, - "support": 14534.0 + "f1-score": 0.8970938243768007, + "precision": 0.8933449759870268, + "recall": 0.9008742688219384, + "support": 15899.0 }, - "eval_accuracy": 0.8492007640494621, - "eval_loss": 1.1699731349945068, + "eval_accuracy": 0.8632835820895522, + "eval_loss": 1.108552098274231, "eval_macro avg": { - "f1-score": 0.8094367225114796, - "precision": 0.8062030508839487, - "recall": 0.8128032084694936, - "support": 29841.0 - }, - "eval_runtime": 4.802, - "eval_samples_per_second": 16.66, - "eval_steps_per_second": 2.082, + "f1-score": 0.8293591325166445, + "precision": 0.8294593978044343, + "recall": 0.8293850631296864, + "support": 33500.0 + }, + "eval_runtime": 4.9242, + "eval_samples_per_second": 16.449, + "eval_steps_per_second": 2.234, "eval_weighted avg": { - "f1-score": 0.8493576914930753, - "precision": 0.8496026739182283, - "recall": 0.8492007640494621, - "support": 29841.0 + "f1-score": 0.8637635648495541, + "precision": 0.864372798011359, + "recall": 0.8632835820895522, + "support": 33500.0 }, "step": 1944 }, { "epoch": 24.69, - "grad_norm": 9.07358169555664, + "grad_norm": 0.41564273834228516, "learning_rate": 1.0123456790123458e-05, - "loss": 0.006, + "loss": 0.0102, "step": 2000 }, { "epoch": 25.0, "eval_Claim": { - "f1-score": 0.622420524261015, - "precision": 0.632940108892922, - "recall": 0.6122448979591837, - "support": 4557.0 + "f1-score": 0.6543478260869565, + "precision": 0.6391891891891892, + "recall": 0.6702429149797571, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8149307107733571, - "precision": 0.8267573696145125, - "recall": 0.8034376377258704, - "support": 2269.0 + "f1-score": 0.8417964342134958, + "precision": 0.8314757021845742, + "recall": 0.8523765996343693, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9018776855612456, - "precision": 0.9004466384579219, - "recall": 0.9033132885272963, - "support": 8481.0 + "f1-score": 0.9077508785630614, + "precision": 0.9285072391412881, + "recall": 0.8879022247684523, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8975866548164354, - "precision": 0.8919157608695653, - "recall": 0.9033301224714463, - "support": 14534.0 + "f1-score": 0.8887081130127343, + "precision": 0.884198729921554, + "recall": 0.8932637272784452, + "support": 15899.0 }, - "eval_accuracy": 0.8512784424114473, - "eval_loss": 1.1391637325286865, + "eval_accuracy": 0.8560298507462687, + "eval_loss": 1.0723340511322021, "eval_macro avg": { - "f1-score": 0.8092038938530133, - "precision": 0.8130149694587304, - "recall": 0.8055814866709491, - "support": 29841.0 - }, - "eval_runtime": 4.83, - "eval_samples_per_second": 16.563, - "eval_steps_per_second": 2.07, + "f1-score": 0.8231508129690621, + "precision": 0.8208427151091513, + "recall": 0.8259463666652559, + "support": 33500.0 + }, + "eval_runtime": 4.8953, + "eval_samples_per_second": 16.546, + "eval_steps_per_second": 2.247, "eval_weighted avg": { - "f1-score": 0.8505008948811765, - "precision": 0.8498378793311306, - "recall": 0.8512784424114473, - "support": 29841.0 + "f1-score": 0.8570380328032566, + "precision": 0.8584774732395206, + "recall": 0.8560298507462687, + "support": 33500.0 }, "step": 2025 }, { "epoch": 26.0, "eval_Claim": { - "f1-score": 0.6216186854970125, - "precision": 0.6155335628227194, - "recall": 0.6278253236778583, - "support": 4557.0 + "f1-score": 0.6502824298880191, + "precision": 0.636963696369637, + "recall": 0.66417004048583, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8021786492374727, - "precision": 0.7931925894011203, - "recall": 0.8113706478624945, - "support": 2269.0 + "f1-score": 0.8458110516934045, + "precision": 0.8252173913043478, + "recall": 0.8674588665447898, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9000058854687776, - "precision": 0.8984723854289072, - "recall": 0.9015446291710884, - "support": 8481.0 + "f1-score": 0.912881895844394, + "precision": 0.9229943392543432, + "recall": 0.9029886374486775, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8959025470653377, - "precision": 0.9012672329759086, - "recall": 0.8906013485619926, - "support": 14534.0 + "f1-score": 0.8878304207936407, + "precision": 0.8905271151047269, + "recall": 0.8851500094345557, + "support": 15899.0 }, - "eval_accuracy": 0.8475587279246674, - "eval_loss": 1.18631911277771, + "eval_accuracy": 0.8569850746268657, + "eval_loss": 1.126774787902832, "eval_macro avg": { - "f1-score": 0.80492644181715, - "precision": 0.8021164426571639, - "recall": 0.8078354873183584, - "support": 29841.0 - }, - "eval_runtime": 4.7928, - "eval_samples_per_second": 16.692, - "eval_steps_per_second": 2.086, + "f1-score": 0.8242014495548646, + "precision": 0.8189256355082637, + "recall": 0.8299418884784633, + "support": 33500.0 + }, + "eval_runtime": 4.9541, + "eval_samples_per_second": 16.35, + "eval_steps_per_second": 2.22, "eval_weighted avg": { - "f1-score": 0.8480566079768785, - "precision": 0.848621115111045, - "recall": 0.8475587279246674, - "support": 29841.0 + "f1-score": 0.8578882907501019, + "precision": 0.8590204964268868, + "recall": 0.8569850746268657, + "support": 33500.0 }, "step": 2106 }, { "epoch": 27.0, "eval_Claim": { - "f1-score": 0.6274287012839449, - "precision": 0.6505655042412818, - "recall": 0.6058810621022602, - "support": 4557.0 + "f1-score": 0.6497180730042537, + "precision": 0.6353259818146644, + "recall": 0.6647773279352227, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8276779773785763, - "precision": 0.8330357142857143, - "recall": 0.8223887174966946, - "support": 2269.0 + "f1-score": 0.8471862491170237, + "precision": 0.8737251092763477, + "recall": 0.8222120658135283, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9055736912102527, - "precision": 0.9291651159905719, - "recall": 0.8831505718665251, - "support": 8481.0 + "f1-score": 0.9101418812401472, + "precision": 0.9107074569789675, + "recall": 0.9095770075432064, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8996312437143815, - "precision": 0.8772228033472803, - "recall": 0.9232145314435117, - "support": 14534.0 + "f1-score": 0.889659739522563, + "precision": 0.8921072603086264, + "recall": 0.8872256116736902, + "support": 15899.0 }, - "eval_accuracy": 0.8557018866659964, - "eval_loss": 1.173492431640625, + "eval_accuracy": 0.8571641791044776, + "eval_loss": 1.101758360862732, "eval_macro avg": { - "f1-score": 0.8150779033967888, - "precision": 0.8224972844662122, - "recall": 0.8086587207272479, - "support": 29841.0 - }, - "eval_runtime": 4.7958, - "eval_samples_per_second": 16.681, - "eval_steps_per_second": 2.085, + "f1-score": 0.824176485720997, + "precision": 0.8279664520946515, + "recall": 0.8209480032414119, + "support": 33500.0 + }, + "eval_runtime": 4.9026, + "eval_samples_per_second": 16.522, + "eval_steps_per_second": 2.244, "eval_weighted avg": { - "f1-score": 0.8542811867471567, - "precision": 0.8540126205927153, - "recall": 0.8557018866659964, - "support": 29841.0 + "f1-score": 0.8579064750628762, + "precision": 0.8588559229208557, + "recall": 0.8571641791044776, + "support": 33500.0 }, "step": 2187 }, { "epoch": 28.0, "eval_Claim": { - "f1-score": 0.6397700895324416, - "precision": 0.644543429844098, - "recall": 0.6350669299978056, - "support": 4557.0 + "f1-score": 0.6493561775034585, + "precision": 0.6845411711913844, + "recall": 0.6176113360323887, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8197434224831485, - "precision": 0.8090128755364807, - "recall": 0.8307624504186867, - "support": 2269.0 + "f1-score": 0.846973475402403, + "precision": 0.8403058929374719, + "recall": 0.8537477148080439, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9052350945225399, - "precision": 0.9310731646516266, - "recall": 0.8807923593915812, - "support": 8481.0 + "f1-score": 0.9125746196803388, + "precision": 0.9202835226721041, + "recall": 0.9049937935644037, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9018691588785046, - "precision": 0.8879183891185491, - "recall": 0.916265308930783, - "support": 14534.0 + "f1-score": 0.8957433682911783, + "precision": 0.8788814236426367, + "recall": 0.9132649852191962, + "support": 15899.0 }, - "eval_accuracy": 0.856740725846989, - "eval_loss": 1.153747797012329, + "eval_accuracy": 0.8631940298507462, + "eval_loss": 1.0291390419006348, "eval_macro avg": { - "f1-score": 0.8166544413541587, - "precision": 0.8181369647876886, - "recall": 0.815721762184714, - "support": 29841.0 - }, - "eval_runtime": 4.8135, - "eval_samples_per_second": 16.62, - "eval_steps_per_second": 2.077, + "f1-score": 0.8261619102193447, + "precision": 0.8310030026108993, + "recall": 0.8224044574060082, + "support": 33500.0 + }, + "eval_runtime": 4.895, + "eval_samples_per_second": 16.548, + "eval_steps_per_second": 2.247, "eval_weighted avg": { - "f1-score": 0.8565562586843419, - "precision": 0.8570179283955386, - "recall": 0.856740725846989, - "support": 29841.0 + "f1-score": 0.8614870234454082, + "precision": 0.8606473960260256, + "recall": 0.8631940298507462, + "support": 33500.0 }, "step": 2268 }, { "epoch": 29.0, "eval_Claim": { - "f1-score": 0.6479684334008745, - "precision": 0.6302904564315353, - "recall": 0.6666666666666666, - "support": 4557.0 + "f1-score": 0.6583255135022417, + "precision": 0.6787787572565039, + "recall": 0.6390688259109312, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8285593934288121, - "precision": 0.7934651068979427, - "recall": 0.8669017188188629, - "support": 2269.0 + "f1-score": 0.8515981735159819, + "precision": 0.8508211678832117, + "recall": 0.8523765996343693, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9062767649577879, - "precision": 0.9417673235855054, - "recall": 0.8733639900955076, - "support": 8481.0 + "f1-score": 0.9123429557878584, + "precision": 0.916385704652731, + "recall": 0.9083357204239473, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8984971414877958, - "precision": 0.8941200517816993, - "recall": 0.9029172973716802, - "support": 14534.0 + "f1-score": 0.8947940947940948, + "precision": 0.8844310641435242, + "recall": 0.9054028555255047, + "support": 15899.0 }, - "eval_accuracy": 0.8557018866659964, - "eval_loss": 1.141819953918457, + "eval_accuracy": 0.8635820895522388, + "eval_loss": 1.1136515140533447, "eval_macro avg": { - "f1-score": 0.8203254333188175, - "precision": 0.8149107346741707, - "recall": 0.8274624182381793, - "support": 29841.0 - }, - "eval_runtime": 4.7777, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 2.093, + "f1-score": 0.8292651844000442, + "precision": 0.8326041734839926, + "recall": 0.8262960003736881, + "support": 33500.0 + }, + "eval_runtime": 4.9179, + "eval_samples_per_second": 16.47, + "eval_steps_per_second": 2.237, "eval_weighted avg": { - "f1-score": 0.857132271461693, - "precision": 0.8597190255498753, - "recall": 0.8557018866659964, - "support": 29841.0 + "f1-score": 0.8625887740134804, + "precision": 0.8618997238752699, + "recall": 0.8635820895522388, + "support": 33500.0 }, "step": 2349 }, { "epoch": 30.0, "eval_Claim": { - "f1-score": 0.6132195178221248, - "precision": 0.6464007782101168, - "recall": 0.5832784726793944, - "support": 4557.0 + "f1-score": 0.6518860985604706, + "precision": 0.677736508630107, + "recall": 0.6279352226720648, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8116131848941279, - "precision": 0.8040657439446367, - "recall": 0.8193036579991185, - "support": 2269.0 + "f1-score": 0.8529746979712788, + "precision": 0.8508412914961346, + "recall": 0.8551188299817185, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9048840121653051, - "precision": 0.9154198841698842, - "recall": 0.8945879023700035, - "support": 8481.0 + "f1-score": 0.911866692352148, + "precision": 0.919930035953746, + "recall": 0.9039434736942614, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9030779085055456, - "precision": 0.8853195849031661, - "recall": 0.9215632310444475, - "support": 14534.0 + "f1-score": 0.8956451812445873, + "precision": 0.8810929227773383, + "recall": 0.9106862066796654, + "support": 15899.0 }, - "eval_accuracy": 0.8544619818370698, - "eval_loss": 1.1914094686508179, + "eval_accuracy": 0.8632537313432835, + "eval_loss": 1.123184084892273, "eval_macro avg": { - "f1-score": 0.8081986558467759, - "precision": 0.8128014978069509, - "recall": 0.804683316023241, - "support": 29841.0 - }, - "eval_runtime": 4.773, - "eval_samples_per_second": 16.761, - "eval_steps_per_second": 2.095, + "f1-score": 0.8280931675321211, + "precision": 0.8324001897143315, + "recall": 0.8244209332569276, + "support": 33500.0 + }, + "eval_runtime": 4.9146, + "eval_samples_per_second": 16.482, + "eval_steps_per_second": 2.238, "eval_weighted avg": { - "f1-score": 0.8523724837851865, - "precision": 0.8512108978901942, - "recall": 0.8544619818370698, - "support": 29841.0 + "f1-score": 0.8619841364675112, + "precision": 0.8612711266927389, + "recall": 0.8632537313432835, + "support": 33500.0 }, "step": 2430 }, { "epoch": 30.86, - "grad_norm": 0.007714413572102785, + "grad_norm": 0.36268848180770874, "learning_rate": 7.654320987654322e-06, - "loss": 0.0028, + "loss": 0.0075, "step": 2500 }, { "epoch": 31.0, "eval_Claim": { - "f1-score": 0.6275360746446783, - "precision": 0.6206008583690987, - "recall": 0.6346280447662936, - "support": 4557.0 + "f1-score": 0.6331647476595287, + "precision": 0.6758557316793017, + "recall": 0.5955465587044534, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8174338447854126, - "precision": 0.8249551166965888, - "recall": 0.8100484795063905, - "support": 2269.0 + "f1-score": 0.8522257916475449, + "precision": 0.8557603686635945, + "recall": 0.8487202925045704, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9020403293163107, - "precision": 0.9129332206255283, - "recall": 0.8914043155288291, - "support": 8481.0 + "f1-score": 0.9158597986057321, + "precision": 0.928901109692625, + "recall": 0.9031796046977943, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8989933575292748, - "precision": 0.8947655398037078, - "recall": 0.9032613182881519, - "support": 14534.0 + "f1-score": 0.8934022573639618, + "precision": 0.8695962843872812, + "recall": 0.9185483363733569, + "support": 15899.0 }, - "eval_accuracy": 0.8517811065312825, - "eval_loss": 1.231397271156311, + "eval_accuracy": 0.8615522388059701, + "eval_loss": 1.120849370956421, "eval_macro avg": { - "f1-score": 0.8115009015689192, - "precision": 0.8133136838737309, - "recall": 0.8098355395224164, - "support": 29841.0 - }, - "eval_runtime": 4.7995, - "eval_samples_per_second": 16.668, - "eval_steps_per_second": 2.084, + "f1-score": 0.8236631488191918, + "precision": 0.8325283736057006, + "recall": 0.8164986980700437, + "support": 33500.0 + }, + "eval_runtime": 4.9277, + "eval_samples_per_second": 16.438, + "eval_steps_per_second": 2.232, "eval_weighted avg": { - "f1-score": 0.8522037725691503, - "precision": 0.8527532680206674, - "recall": 0.8517811065312825, - "support": 29841.0 + "f1-score": 0.8593583894385183, + "precision": 0.858663392490028, + "recall": 0.8615522388059701, + "support": 33500.0 }, "step": 2511 }, { "epoch": 32.0, "eval_Claim": { - "f1-score": 0.6187466523835029, - "precision": 0.6044370029300963, - "recall": 0.6337502743032697, - "support": 4557.0 + "f1-score": 0.6540556600970584, + "precision": 0.6402947450067868, + "recall": 0.6684210526315789, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8172382671480145, - "precision": 0.8372630605640314, - "recall": 0.7981489643014544, - "support": 2269.0 + "f1-score": 0.8491992882562277, + "precision": 0.8271230502599654, + "recall": 0.8724862888482633, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9010989010989012, - "precision": 0.9079482882451521, - "recall": 0.8943520811225092, - "support": 8481.0 + "f1-score": 0.9160624787114983, + "precision": 0.934014685453463, + "recall": 0.8987873579681085, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8937414030261347, - "precision": 0.8933727485219304, - "recall": 0.8941103619100041, - "support": 14534.0 + "f1-score": 0.8915745856353591, + "precision": 0.8899542520523908, + "recall": 0.8932008302408957, + "support": 15899.0 }, - "eval_accuracy": 0.847123085687477, - "eval_loss": 1.2467483282089233, + "eval_accuracy": 0.8604477611940299, + "eval_loss": 1.1111246347427368, "eval_macro avg": { - "f1-score": 0.8077063059141383, - "precision": 0.8107552750653025, - "recall": 0.8050904204093093, - "support": 29841.0 - }, - "eval_runtime": 4.804, - "eval_samples_per_second": 16.653, - "eval_steps_per_second": 2.082, + "f1-score": 0.8277230031750359, + "precision": 0.8228466831931516, + "recall": 0.8332238824222116, + "support": 33500.0 + }, + "eval_runtime": 4.919, + "eval_samples_per_second": 16.467, + "eval_steps_per_second": 2.236, "eval_weighted avg": { - "f1-score": 0.8480211606471663, - "precision": 0.8491256414462351, - "recall": 0.847123085687477, - "support": 29841.0 + "f1-score": 0.8614373038849609, + "precision": 0.8628095441324599, + "recall": 0.8604477611940299, + "support": 33500.0 }, "step": 2592 }, { "epoch": 33.0, "eval_Claim": { - "f1-score": 0.6165579750193435, - "precision": 0.6211581291759466, - "recall": 0.6120254553434277, - "support": 4557.0 + "f1-score": 0.6564330438295295, + "precision": 0.6549778315195486, + "recall": 0.6578947368421053, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8063751884557399, - "precision": 0.7885425442291492, - "recall": 0.8250330542089026, - "support": 2269.0 + "f1-score": 0.8466696468484577, + "precision": 0.8285214348206474, + "recall": 0.8656307129798904, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.905199879771566, - "precision": 0.9233505028207015, - "recall": 0.8877490861926659, - "support": 8481.0 + "f1-score": 0.9148585819449826, + "precision": 0.9282555282555283, + "recall": 0.9018428339539769, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.897230643458119, - "precision": 0.8884841125278283, - "recall": 0.9061510939865144, - "support": 14534.0 + "f1-score": 0.8948586439829872, + "precision": 0.8899048329912297, + "recall": 0.899867916221146, + "support": 15899.0 }, - "eval_accuracy": 0.8498374719345867, - "eval_loss": 1.2608078718185425, + "eval_accuracy": 0.8625671641791045, + "eval_loss": 1.145164132118225, "eval_macro avg": { - "f1-score": 0.8063409216761921, - "precision": 0.8053838221884064, - "recall": 0.8077396724328777, - "support": 29841.0 - }, - "eval_runtime": 4.7947, - "eval_samples_per_second": 16.685, - "eval_steps_per_second": 2.086, + "f1-score": 0.8282049791514892, + "precision": 0.8254149068967386, + "recall": 0.8313090499992797, + "support": 33500.0 + }, + "eval_runtime": 5.0162, + "eval_samples_per_second": 16.148, + "eval_steps_per_second": 2.193, "eval_weighted avg": { - "f1-score": 0.8497258921327092, - "precision": 0.8499709906977834, - "recall": 0.8498374719345867, - "support": 29841.0 + "f1-score": 0.862804893528884, + "precision": 0.8632421634102047, + "recall": 0.8625671641791045, + "support": 33500.0 }, "step": 2673 }, { "epoch": 34.0, "eval_Claim": { - "f1-score": 0.6242761692650335, - "precision": 0.633732760569749, - "recall": 0.6150976519640114, - "support": 4557.0 + "f1-score": 0.6356152512998267, + "precision": 0.6835973904939422, + "recall": 0.5939271255060729, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8270332187857962, - "precision": 0.8611641221374046, - "recall": 0.7955046275892463, - "support": 2269.0 + "f1-score": 0.8559207564160288, + "precision": 0.8433895297249334, + "recall": 0.8688299817184644, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9015324995596267, - "precision": 0.8978947368421053, - "recall": 0.9051998585072515, - "support": 8481.0 + "f1-score": 0.9127349443805141, + "precision": 0.9166907444861794, + "recall": 0.9088131385467393, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8962669760458609, - "precision": 0.8890468453831574, - "recall": 0.9036053392046236, - "support": 14534.0 + "f1-score": 0.8947336002463814, + "precision": 0.876591635990586, + "recall": 0.9136423674444933, + "support": 15899.0 }, - "eval_accuracy": 0.8517811065312825, - "eval_loss": 1.2305262088775635, + "eval_accuracy": 0.8620597014925373, + "eval_loss": 1.1328134536743164, "eval_macro avg": { - "f1-score": 0.8122772159140793, - "precision": 0.820459616233104, - "recall": 0.8048518693162833, - "support": 29841.0 - }, - "eval_runtime": 4.7809, - "eval_samples_per_second": 16.733, - "eval_steps_per_second": 2.092, + "f1-score": 0.8247511380856878, + "precision": 0.8300673251739102, + "recall": 0.8213031533039424, + "support": 33500.0 + }, + "eval_runtime": 4.886, + "eval_samples_per_second": 16.578, + "eval_steps_per_second": 2.251, "eval_weighted avg": { - "f1-score": 0.8509636485165197, - "precision": 0.8504525215978962, - "recall": 0.8517811065312825, - "support": 29841.0 + "f1-score": 0.8596160160977241, + "precision": 0.858499701125263, + "recall": 0.8620597014925373, + "support": 33500.0 }, "step": 2754 }, { "epoch": 35.0, "eval_Claim": { - "f1-score": 0.633076593923834, - "precision": 0.6176163640158631, - "recall": 0.6493307000219443, - "support": 4557.0 + "f1-score": 0.6474583247581807, + "precision": 0.6584344914190038, + "recall": 0.6368421052631579, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8311867525298988, - "precision": 0.8691678691678691, - "recall": 0.7963860731599823, - "support": 2269.0 + "f1-score": 0.8435185185185186, + "precision": 0.8545966228893058, + "recall": 0.8327239488117002, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9039272770483037, - "precision": 0.9110179640718563, - "recall": 0.8969461148449476, - "support": 8481.0 + "f1-score": 0.9133458015633241, + "precision": 0.9174373795761079, + "recall": 0.9092905566695312, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8963128108386212, - "precision": 0.8936461254360167, - "recall": 0.8989954589239025, - "support": 14534.0 + "f1-score": 0.8930206484163319, + "precision": 0.8844540407156076, + "recall": 0.9017548273476319, + "support": 15899.0 }, - "eval_accuracy": 0.8524848362990516, - "eval_loss": 1.2047479152679443, + "eval_accuracy": 0.8605373134328358, + "eval_loss": 1.16542649269104, "eval_macro avg": { - "f1-score": 0.8161258585851644, - "precision": 0.8228620806729012, - "recall": 0.8104145867376942, - "support": 29841.0 - }, - "eval_runtime": 4.7907, - "eval_samples_per_second": 16.699, - "eval_steps_per_second": 2.087, + "f1-score": 0.8243358233140887, + "precision": 0.8287306336500063, + "recall": 0.8201528595230052, + "support": 33500.0 + }, + "eval_runtime": 4.925, + "eval_samples_per_second": 16.447, + "eval_steps_per_second": 2.233, "eval_weighted avg": { - "f1-score": 0.8533263097542454, - "precision": 0.8545697465347227, - "recall": 0.8524848362990516, - "support": 29841.0 + "f1-score": 0.8599304033363548, + "precision": 0.8594859781531254, + "recall": 0.8605373134328358, + "support": 33500.0 }, "step": 2835 }, { "epoch": 36.0, "eval_Claim": { - "f1-score": 0.6346997752327946, - "precision": 0.6195152528207272, - "recall": 0.6506473557164801, - "support": 4557.0 + "f1-score": 0.63220675944334, + "precision": 0.654320987654321, + "recall": 0.6115384615384616, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8192934782608694, - "precision": 0.8425710293432697, - "recall": 0.7972675187307183, - "support": 2269.0 + "f1-score": 0.8513604677310547, + "precision": 0.8379814077025233, + "recall": 0.8651736745886655, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9063178271836687, - "precision": 0.9018211533971515, - "recall": 0.9108595684471171, - "support": 8481.0 + "f1-score": 0.9143658430443401, + "precision": 0.9262343260188087, + "recall": 0.9027976701995608, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8959689707715751, - "precision": 0.9019662529633246, - "recall": 0.8900509150956378, - "support": 14534.0 + "f1-score": 0.8918458920006188, + "precision": 0.8778021442495126, + "recall": 0.9063463110887477, + "support": 15899.0 }, - "eval_accuracy": 0.8523507925337622, - "eval_loss": 1.2302902936935425, + "eval_accuracy": 0.8590746268656716, + "eval_loss": 1.1980067491531372, "eval_macro avg": { - "f1-score": 0.8140700128622269, - "precision": 0.8164684221311183, - "recall": 0.8122063394974884, - "support": 29841.0 - }, - "eval_runtime": 4.803, - "eval_samples_per_second": 16.656, - "eval_steps_per_second": 2.082, + "f1-score": 0.8224447405548384, + "precision": 0.8240847164062914, + "recall": 0.8214640293538589, + "support": 33500.0 + }, + "eval_runtime": 4.9337, + "eval_samples_per_second": 16.418, + "eval_steps_per_second": 2.23, "eval_weighted avg": { - "f1-score": 0.8531818066233882, - "precision": 0.8542759088239045, - "recall": 0.8523507925337622, - "support": 29841.0 + "f1-score": 0.857954907646772, + "precision": 0.8573873846830882, + "recall": 0.8590746268656716, + "support": 33500.0 }, "step": 2916 }, { "epoch": 37.0, "eval_Claim": { - "f1-score": 0.6348107625320978, - "precision": 0.6461363636363636, - "recall": 0.6238753565942506, - "support": 4557.0 + "f1-score": 0.6368211365066052, + "precision": 0.6605045672031318, + "recall": 0.6147773279352227, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.821917808219178, - "precision": 0.8526764566556134, - "recall": 0.7933010136624064, - "support": 2269.0 + "f1-score": 0.8573378839590444, + "precision": 0.8536474852741278, + "recall": 0.8610603290676416, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9034164794893014, - "precision": 0.9057721939077872, - "recall": 0.9010729866760995, - "support": 8481.0 + "f1-score": 0.9157544485701886, + "precision": 0.9250779423226813, + "recall": 0.9066170151818963, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9000577700751011, - "precision": 0.8892096958302558, - "recall": 0.9111737993670015, - "support": 14534.0 + "f1-score": 0.8922981750695949, + "precision": 0.8778528391455176, + "recall": 0.9072268696144412, + "support": 15899.0 }, - "eval_accuracy": 0.85546731007674, - "eval_loss": 1.2363109588623047, + "eval_accuracy": 0.8608955223880597, + "eval_loss": 1.1901870965957642, "eval_macro avg": { - "f1-score": 0.8150507050789195, - "precision": 0.823448677507505, - "recall": 0.8073557890749394, - "support": 29841.0 - }, - "eval_runtime": 4.7822, - "eval_samples_per_second": 16.729, - "eval_steps_per_second": 2.091, + "f1-score": 0.8255529110263582, + "precision": 0.8292707084863646, + "recall": 0.8224203854498005, + "support": 33500.0 + }, + "eval_runtime": 4.927, + "eval_samples_per_second": 16.44, + "eval_steps_per_second": 2.233, "eval_weighted avg": { - "f1-score": 0.8545651601664946, - "precision": 0.8540194358423435, - "recall": 0.85546731007674, - "support": 29841.0 + "f1-score": 0.859674529246331, + "precision": 0.8589849802771131, + "recall": 0.8608955223880597, + "support": 33500.0 }, "step": 2997 }, { "epoch": 37.04, - "grad_norm": 0.3124696612358093, + "grad_norm": 0.8262068033218384, "learning_rate": 5.185185185185185e-06, - "loss": 0.0015, + "loss": 0.0042, "step": 3000 }, { "epoch": 38.0, "eval_Claim": { - "f1-score": 0.6297771557756486, - "precision": 0.6181318681318682, - "recall": 0.6418696510862409, - "support": 4557.0 + "f1-score": 0.6409235668789809, + "precision": 0.6303837118245889, + "recall": 0.6518218623481782, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8197488827410088, - "precision": 0.7925925925925926, - "recall": 0.8488320846187748, - "support": 2269.0 + "f1-score": 0.8523321956769055, + "precision": 0.8486633439057544, + "recall": 0.8560329067641682, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9054678007290401, - "precision": 0.9339516230104024, - "recall": 0.8786699681641316, - "support": 8481.0 + "f1-score": 0.9147144240077445, + "precision": 0.9275547266123491, + "recall": 0.9022247684522104, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8958062529930902, - "precision": 0.8907482993197279, - "recall": 0.9009219760561442, - "support": 14534.0 + "f1-score": 0.8904285669498698, + "precision": 0.8876734591823978, + "recall": 0.8932008302408957, + "support": 15899.0 }, - "eval_accuracy": 0.8510773767635132, - "eval_loss": 1.264951467514038, + "eval_accuracy": 0.858, + "eval_loss": 1.198099136352539, "eval_macro avg": { - "f1-score": 0.812700023059697, - "precision": 0.8088560957636478, - "recall": 0.8175734199813228, - "support": 29841.0 - }, - "eval_runtime": 4.8007, - "eval_samples_per_second": 16.664, - "eval_steps_per_second": 2.083, + "f1-score": 0.8245996883783752, + "precision": 0.8235688103812725, + "recall": 0.8258200919513632, + "support": 33500.0 + }, + "eval_runtime": 4.9138, + "eval_samples_per_second": 16.484, + "eval_steps_per_second": 2.239, "eval_weighted avg": { - "f1-score": 0.8521438696020087, - "precision": 0.8539324758799526, - "recall": 0.8510773767635132, - "support": 29841.0 + "f1-score": 0.8587400959132037, + "precision": 0.8596528929024279, + "recall": 0.858, + "support": 33500.0 }, "step": 3078 }, { "epoch": 39.0, "eval_Claim": { - "f1-score": 0.6320949994552784, - "precision": 0.6276503678061445, - "recall": 0.6366030283080975, - "support": 4557.0 + "f1-score": 0.6499377851513894, + "precision": 0.6662414965986394, + "recall": 0.6344129554655871, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8298865910607072, - "precision": 0.8375224416517055, - "recall": 0.8223887174966946, - "support": 2269.0 + "f1-score": 0.8481362172112287, + "precision": 0.8540315106580166, + "recall": 0.8423217550274223, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9067027918482744, - "precision": 0.90584912321996, - "recall": 0.9075580709821955, - "support": 8481.0 + "f1-score": 0.9112606807007495, + "precision": 0.9111302023673158, + "recall": 0.9113911964098157, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.897340498828717, - "precision": 0.8985787222298882, - "recall": 0.8961056832255401, - "support": 14534.0 + "f1-score": 0.8928604847010387, + "precision": 0.8855958420987502, + "recall": 0.9002452984464432, + "support": 15899.0 }, - "eval_accuracy": 0.8541268724238464, - "eval_loss": 1.2218141555786133, + "eval_accuracy": 0.8607462686567164, + "eval_loss": 1.214090347290039, "eval_macro avg": { - "f1-score": 0.8165062202982443, - "precision": 0.8174001637269246, - "recall": 0.8156638750031319, - "support": 29841.0 - }, - "eval_runtime": 4.7791, - "eval_samples_per_second": 16.74, - "eval_steps_per_second": 2.092, + "f1-score": 0.8255487919411015, + "precision": 0.8292497629306805, + "recall": 0.822092801337317, + "support": 33500.0 + }, + "eval_runtime": 4.9164, + "eval_samples_per_second": 16.475, + "eval_steps_per_second": 2.237, "eval_weighted avg": { - "f1-score": 0.8543669037658335, - "precision": 0.85462922519748, - "recall": 0.8541268724238464, - "support": 29841.0 + "f1-score": 0.8598697509596058, + "precision": 0.8591704131772522, + "recall": 0.8607462686567164, + "support": 33500.0 }, "step": 3159 }, { "epoch": 40.0, "eval_Claim": { - "f1-score": 0.6463350510043117, - "precision": 0.6205573505654282, - "recall": 0.674347158218126, - "support": 4557.0 + "f1-score": 0.6468762929251138, + "precision": 0.6613790186125211, + "recall": 0.632995951417004, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8254958769779362, - "precision": 0.8349864743011722, - "recall": 0.8162185985015425, - "support": 2269.0 + "f1-score": 0.8509220173294822, + "precision": 0.8279290964115866, + "recall": 0.8752285191956124, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9064204783885857, - "precision": 0.9219512195121952, - "recall": 0.8914043155288291, - "support": 8481.0 + "f1-score": 0.9132591629340654, + "precision": 0.921379980563654, + "recall": 0.9052802444380789, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8983278745043958, - "precision": 0.9002833252712321, - "recall": 0.8963808999587175, - "support": 14534.0 + "f1-score": 0.8917924410627417, + "precision": 0.8843465891520812, + "recall": 0.8993647399207497, + "support": 15899.0 }, - "eval_accuracy": 0.8549646459569049, - "eval_loss": 1.2532273530960083, + "eval_accuracy": 0.8603582089552239, + "eval_loss": 1.218752145767212, "eval_macro avg": { - "f1-score": 0.8191448202188073, - "precision": 0.8194445924125069, - "recall": 0.8195877430518038, - "support": 29841.0 - }, - "eval_runtime": 4.7911, - "eval_samples_per_second": 16.697, - "eval_steps_per_second": 2.087, + "f1-score": 0.8257124785628508, + "precision": 0.8237586711849608, + "recall": 0.8282173637428613, + "support": 33500.0 + }, + "eval_runtime": 5.1955, + "eval_samples_per_second": 15.59, + "eval_steps_per_second": 2.117, "eval_weighted avg": { - "f1-score": 0.8566083032589413, - "precision": 0.8587597700777799, - "recall": 0.8549646459569049, - "support": 29841.0 + "f1-score": 0.8597181341740886, + "precision": 0.8593600051422834, + "recall": 0.8603582089552239, + "support": 33500.0 }, "step": 3240 }, { "epoch": 41.0, "eval_Claim": { - "f1-score": 0.6371372463451888, - "precision": 0.6335430679106097, - "recall": 0.6407724380074611, - "support": 4557.0 + "f1-score": 0.646806774127729, + "precision": 0.6519950637597697, + "recall": 0.6417004048582996, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8270404702690481, - "precision": 0.8491179201485608, - "recall": 0.8060819744380785, - "support": 2269.0 + "f1-score": 0.8511878081577768, + "precision": 0.8350923482849604, + "recall": 0.8679159049360147, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9051774973463852, - "precision": 0.905391058157367, - "recall": 0.9049640372597572, - "support": 8481.0 + "f1-score": 0.9144551375522505, + "precision": 0.9312939312939313, + "recall": 0.8982144562207581, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8991934099879869, - "precision": 0.8971303335387987, - "recall": 0.9012659969726159, - "support": 14534.0 + "f1-score": 0.8959641813320066, + "precision": 0.8859374039230155, + "recall": 0.9062205170136487, + "support": 15899.0 }, - "eval_accuracy": 0.8552997553701284, - "eval_loss": 1.2720471620559692, + "eval_accuracy": 0.8622089552238806, + "eval_loss": 1.1967241764068604, "eval_macro avg": { - "f1-score": 0.8171371559871523, - "precision": 0.821295594938834, - "recall": 0.8132711116694782, - "support": 29841.0 - }, - "eval_runtime": 4.7858, - "eval_samples_per_second": 16.716, - "eval_steps_per_second": 2.09, + "f1-score": 0.8271034752924407, + "precision": 0.8260796868154192, + "recall": 0.8285128207571802, + "support": 33500.0 + }, + "eval_runtime": 4.9208, + "eval_samples_per_second": 16.461, + "eval_steps_per_second": 2.235, "eval_weighted avg": { - "f1-score": 0.8553894519083003, - "precision": 0.8555751534188286, - "recall": 0.8552997553701284, - "support": 29841.0 + "f1-score": 0.8620790317320146, + "precision": 0.8622984418040036, + "recall": 0.8622089552238806, + "support": 33500.0 }, "step": 3321 }, { "epoch": 42.0, "eval_Claim": { - "f1-score": 0.6300342759211655, - "precision": 0.6154007114459091, - "recall": 0.6453807329383366, - "support": 4557.0 + "f1-score": 0.6463245492371706, + "precision": 0.63290648040357, + "recall": 0.6603238866396761, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8309070548712206, - "precision": 0.8447176684881603, - "recall": 0.8175407668576465, - "support": 2269.0 + "f1-score": 0.8430155210643016, + "precision": 0.8186907838070628, + "recall": 0.8688299817184644, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9059788703299297, - "precision": 0.9069959820373434, - "recall": 0.9049640372597572, - "support": 8481.0 + "f1-score": 0.9103991443434294, + "precision": 0.9273969889064976, + "recall": 0.8940131767401891, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8946713663694795, - "precision": 0.8987086920299917, - "recall": 0.8906701527452869, - "support": 14534.0 + "f1-score": 0.8930782040405945, + "precision": 0.8922651933701657, + "recall": 0.8938926976539405, + "support": 15899.0 }, - "eval_accuracy": 0.8517140846486377, - "eval_loss": 1.273967981338501, + "eval_accuracy": 0.8578507462686568, + "eval_loss": 1.2189435958862305, "eval_macro avg": { - "f1-score": 0.8153978918729488, - "precision": 0.8164557635003511, - "recall": 0.8146389224502568, - "support": 29841.0 - }, - "eval_runtime": 4.785, - "eval_samples_per_second": 16.719, - "eval_steps_per_second": 2.09, + "f1-score": 0.8232043546713739, + "precision": 0.817814861621824, + "recall": 0.8292649356880676, + "support": 33500.0 + }, + "eval_runtime": 4.9128, + "eval_samples_per_second": 16.488, + "eval_steps_per_second": 2.239, "eval_weighted avg": { - "f1-score": 0.8526240655794947, - "precision": 0.8536949326591351, - "recall": 0.8517140846486377, - "support": 29841.0 + "f1-score": 0.8588364727782227, + "precision": 0.8601972066380149, + "recall": 0.8578507462686568, + "support": 33500.0 }, "step": 3402 }, { "epoch": 43.0, "eval_Claim": { - "f1-score": 0.6327562103451985, - "precision": 0.620413327709827, - "recall": 0.6456001755540927, - "support": 4557.0 + "f1-score": 0.6505707647237094, + "precision": 0.6493244605767292, + "recall": 0.6518218623481782, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8331148973350809, - "precision": 0.8258986574274578, - "recall": 0.8404583516967827, - "support": 2269.0 + "f1-score": 0.8504863153132776, + "precision": 0.8419167039856695, + "recall": 0.8592321755027422, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9066080864454076, - "precision": 0.9130590767758909, - "recall": 0.9002476123098692, - "support": 8481.0 + "f1-score": 0.9151807228915662, + "precision": 0.9239077551814732, + "recall": 0.9066170151818963, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8955873213175887, - "precision": 0.8988771832547824, - "recall": 0.8923214531443512, - "support": 14534.0 + "f1-score": 0.8942687128092702, + "precision": 0.8905869877113093, + "recall": 0.8979810050946601, + "support": 15899.0 }, - "eval_accuracy": 0.8529539894775644, - "eval_loss": 1.2849647998809814, + "eval_accuracy": 0.8618507462686568, + "eval_loss": 1.2199524641036987, "eval_macro avg": { - "f1-score": 0.8170166288608189, - "precision": 0.8145620612919895, - "recall": 0.819656898176274, - "support": 29841.0 - }, - "eval_runtime": 4.7796, - "eval_samples_per_second": 16.738, - "eval_steps_per_second": 2.092, + "f1-score": 0.8276266289344558, + "precision": 0.8264339768637954, + "recall": 0.8289130145318692, + "support": 33500.0 + }, + "eval_runtime": 4.8976, + "eval_samples_per_second": 16.539, + "eval_steps_per_second": 2.246, "eval_weighted avg": { - "f1-score": 0.8538325478961732, - "precision": 0.8548347106208881, - "recall": 0.8529539894775644, - "support": 29841.0 + "f1-score": 0.8620104361623443, + "precision": 0.8622479110808169, + "recall": 0.8618507462686568, + "support": 33500.0 }, "step": 3483 }, { "epoch": 43.21, - "grad_norm": 11.103137969970703, + "grad_norm": 0.7243998050689697, "learning_rate": 2.7160493827160496e-06, - "loss": 0.001, + "loss": 0.0038, "step": 3500 }, { "epoch": 44.0, "eval_Claim": { - "f1-score": 0.6296918767507003, - "precision": 0.6433150183150184, - "recall": 0.6166337502743032, - "support": 4557.0 + "f1-score": 0.649113924050633, + "precision": 0.6494427558257345, + "recall": 0.6487854251012146, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8321428571428572, - "precision": 0.8430574400723655, - "recall": 0.8215072719259586, - "support": 2269.0 + "f1-score": 0.8521934758155231, + "precision": 0.8391670358883474, + "recall": 0.8656307129798904, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.908139604019264, - "precision": 0.9159270808347325, - "recall": 0.9004834335573635, - "support": 8481.0 + "f1-score": 0.9142580488985719, + "precision": 0.9273227263798861, + "recall": 0.9015563830803017, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.9008079299341435, - "precision": 0.8890377914768158, - "recall": 0.9128939039493601, - "support": 14534.0 + "f1-score": 0.8929898516783762, + "precision": 0.886704700483691, + "recall": 0.8993647399207497, + "support": 15899.0 }, - "eval_accuracy": 0.8571763680841795, - "eval_loss": 1.2746751308441162, + "eval_accuracy": 0.8608955223880597, + "eval_loss": 1.2192212343215942, "eval_macro avg": { - "f1-score": 0.8176955669617412, - "precision": 0.822834332674733, - "recall": 0.8128795899267465, - "support": 29841.0 - }, - "eval_runtime": 4.7778, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 2.093, + "f1-score": 0.827138825110776, + "precision": 0.8256593046444147, + "recall": 0.8288343152705391, + "support": 33500.0 + }, + "eval_runtime": 4.9247, + "eval_samples_per_second": 16.448, + "eval_steps_per_second": 2.234, "eval_weighted avg": { - "f1-score": 0.8562686391394492, - "precision": 0.8556595524234826, - "recall": 0.8571763680841795, - "support": 29841.0 + "f1-score": 0.8610117106819026, + "precision": 0.8613108547662561, + "recall": 0.8608955223880597, + "support": 33500.0 }, "step": 3564 }, { "epoch": 45.0, "eval_Claim": { - "f1-score": 0.6363438992618324, - "precision": 0.6296455424274973, - "recall": 0.6431863067807768, - "support": 4557.0 + "f1-score": 0.6460396039603961, + "precision": 0.6585365853658537, + "recall": 0.6340080971659919, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8294691224268689, - "precision": 0.8158567774936062, - "recall": 0.8435434111943587, - "support": 2269.0 + "f1-score": 0.85500340367597, + "precision": 0.8490310950878774, + "recall": 0.8610603290676416, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9093409879201052, - "precision": 0.9225822108967359, - "recall": 0.8964744723499587, - "support": 8481.0 + "f1-score": 0.9148556835156363, + "precision": 0.923443579766537, + "recall": 0.9064260479327795, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8978134761267291, - "precision": 0.8958147818343722, - "recall": 0.8998211091234347, - "support": 14534.0 + "f1-score": 0.8931060228969636, + "precision": 0.8835949522930132, + "recall": 0.902824076985974, + "support": 15899.0 }, - "eval_accuracy": 0.8554002881940954, - "eval_loss": 1.2960079908370972, + "eval_accuracy": 0.8615820895522388, + "eval_loss": 1.2218410968780518, "eval_macro avg": { - "f1-score": 0.8182418714338839, - "precision": 0.8159748281630528, - "recall": 0.8207563248621323, - "support": 29841.0 - }, - "eval_runtime": 4.79, - "eval_samples_per_second": 16.701, - "eval_steps_per_second": 2.088, + "f1-score": 0.8272511785122416, + "precision": 0.8286515531283204, + "recall": 0.8260796377880968, + "support": 33500.0 + }, + "eval_runtime": 4.9427, + "eval_samples_per_second": 16.388, + "eval_steps_per_second": 2.226, "eval_weighted avg": { - "f1-score": 0.8559641623370206, - "precision": 0.8566960066610061, - "recall": 0.8554002881940954, - "support": 29841.0 + "f1-score": 0.8609838603673272, + "precision": 0.8606075082137657, + "recall": 0.8615820895522388, + "support": 33500.0 }, "step": 3645 }, { "epoch": 46.0, "eval_Claim": { - "f1-score": 0.6322691604858648, - "precision": 0.6196797302991993, - "recall": 0.6453807329383366, - "support": 4557.0 + "f1-score": 0.6521695155254374, + "precision": 0.6517081059227815, + "recall": 0.6526315789473685, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8332607749238136, - "precision": 0.8232258064516129, - "recall": 0.8435434111943587, - "support": 2269.0 + "f1-score": 0.8555098308184728, + "precision": 0.8559011893870082, + "recall": 0.8551188299817185, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9089284650664124, - "precision": 0.9183919114106885, - "recall": 0.8996580591911332, - "support": 8481.0 + "f1-score": 0.9134518133217743, + "precision": 0.9215743440233236, + "recall": 0.9054712116871957, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.895985653193544, - "precision": 0.8982160143825197, - "recall": 0.8937663409935324, - "support": 14534.0 + "f1-score": 0.8919814861145858, + "precision": 0.8870436026621882, + "recall": 0.8969746524938675, + "support": 15899.0 }, - "eval_accuracy": 0.8536912301866559, - "eval_loss": 1.2958593368530273, + "eval_accuracy": 0.8608656716417911, + "eval_loss": 1.2380608320236206, "eval_macro avg": { - "f1-score": 0.8176110134174086, - "precision": 0.8148783656360051, - "recall": 0.8205871360793402, - "support": 29841.0 - }, - "eval_runtime": 4.7995, - "eval_samples_per_second": 16.668, - "eval_steps_per_second": 2.084, + "f1-score": 0.8282781614450676, + "precision": 0.8290568104988254, + "recall": 0.8275490682775376, + "support": 33500.0 + }, + "eval_runtime": 4.9319, + "eval_samples_per_second": 16.424, + "eval_steps_per_second": 2.23, "eval_weighted avg": { - "f1-score": 0.8546227357789428, - "precision": 0.8557130538360561, - "recall": 0.8536912301866559, - "support": 29841.0 + "f1-score": 0.8609482807516783, + "precision": 0.8611016175916333, + "recall": 0.8608656716417911, + "support": 33500.0 }, "step": 3726 }, { "epoch": 47.0, "eval_Claim": { - "f1-score": 0.6343719035560937, - "precision": 0.6365444100751215, - "recall": 0.6322141759929778, - "support": 4557.0 + "f1-score": 0.6483549652882584, + "precision": 0.6445289057811562, + "recall": 0.6522267206477733, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8321970530019793, - "precision": 0.8305531167690957, - "recall": 0.8338475099162627, - "support": 2269.0 + "f1-score": 0.8573378839590444, + "precision": 0.8536474852741278, + "recall": 0.8610603290676416, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9086917828537526, - "precision": 0.9144972534033915, - "recall": 0.9029595566560548, - "support": 8481.0 + "f1-score": 0.9157894736842105, + "precision": 0.9263456090651558, + "recall": 0.9054712116871957, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8988594718635478, - "precision": 0.8949055445679601, - "recall": 0.9028484931883859, - "support": 14534.0 + "f1-score": 0.8921016397546626, + "precision": 0.887712524132777, + "recall": 0.8965343732310208, + "support": 15899.0 }, - "eval_accuracy": 0.8563050836097986, - "eval_loss": 1.28843092918396, + "eval_accuracy": 0.8609850746268657, + "eval_loss": 1.2338788509368896, "eval_macro avg": { - "f1-score": 0.8185300528188434, - "precision": 0.8191250812038922, - "recall": 0.8179674339384202, - "support": 29841.0 - }, - "eval_runtime": 4.7779, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 2.093, + "f1-score": 0.8283959906715441, + "precision": 0.8280586310633042, + "recall": 0.8288231586584078, + "support": 33500.0 + }, + "eval_runtime": 5.0503, + "eval_samples_per_second": 16.039, + "eval_steps_per_second": 2.178, "eval_weighted avg": { - "f1-score": 0.8561953839420291, - "precision": 0.8561263459510842, - "recall": 0.8563050836097986, - "support": 29841.0 + "f1-score": 0.8612930133427016, + "precision": 0.861704850067615, + "recall": 0.8609850746268657, + "support": 33500.0 }, "step": 3807 }, { "epoch": 48.0, "eval_Claim": { - "f1-score": 0.6376558058167504, - "precision": 0.6354325561124428, - "recall": 0.6398946675444371, - "support": 4557.0 + "f1-score": 0.6475201140645687, + "precision": 0.6515679442508711, + "recall": 0.6435222672064778, + "support": 4940.0 }, "eval_MajorClaim": { - "f1-score": 0.8332228849127457, - "precision": 0.8352524357838795, - "recall": 0.8312031732040547, - "support": 2269.0 + "f1-score": 0.8567530695770805, + "precision": 0.8524886877828054, + "recall": 0.8610603290676416, + "support": 2188.0 }, "eval_O": { - "f1-score": 0.9087235559781318, - "precision": 0.9160177309212891, - "recall": 0.9015446291710884, - "support": 8481.0 + "f1-score": 0.9163250542560887, + "precision": 0.9257454687195479, + "recall": 0.9070944333046882, + "support": 10473.0 }, "eval_Premise": { - "f1-score": 0.8999006202666118, - "precision": 0.8964293029289274, - "recall": 0.9033989266547406, - "support": 14534.0 + "f1-score": 0.8935346979530704, + "precision": 0.8866183664623196, + "recall": 0.9005597836341909, + "support": 15899.0 }, - "eval_accuracy": 0.8571428571428571, - "eval_loss": 1.2850925922393799, + "eval_accuracy": 0.8621194029850746, + "eval_loss": 1.2307249307632446, "eval_macro avg": { - "f1-score": 0.81987571674356, - "precision": 0.8207830064366348, - "recall": 0.8190103491435802, - "support": 29841.0 - }, - "eval_runtime": 4.7863, - "eval_samples_per_second": 16.714, - "eval_steps_per_second": 2.089, + "f1-score": 0.8285332339627021, + "precision": 0.8291051168038859, + "recall": 0.8280592033032497, + "support": 33500.0 + }, + "eval_runtime": 4.9169, + "eval_samples_per_second": 16.474, + "eval_steps_per_second": 2.237, "eval_weighted avg": { - "f1-score": 0.8572909864340814, - "precision": 0.8574881471703532, - "recall": 0.8571428571428571, - "support": 29841.0 + "f1-score": 0.8619792697221943, + "precision": 0.8619602565896216, + "recall": 0.8621194029850746, + "support": 33500.0 }, "step": 3888 } @@ -2223,7 +2223,7 @@ "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, - "total_flos": 6901859170886400.0, + "total_flos": 6880424825635200.0, "train_batch_size": 4, "trial_name": null, "trial_params": null