|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 9.0, |
|
"eval_steps": 500, |
|
"global_step": 729, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_Claim": { |
|
"f1-score": 0.4888068880688806, |
|
"precision": 0.6228840125391849, |
|
"recall": 0.40222672064777326, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.7325278370054489, |
|
"precision": 0.7604525332021643, |
|
"recall": 0.706581352833638, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.8634848138844484, |
|
"precision": 0.827613377692173, |
|
"recall": 0.902606702950444, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8792819197655248, |
|
"precision": 0.8543458914268763, |
|
"recall": 0.9057173407132524, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8174925373134329, |
|
"eval_loss": 0.49806877970695496, |
|
"eval_macro avg": { |
|
"f1-score": 0.7410253646810757, |
|
"precision": 0.7663239537150996, |
|
"recall": 0.7292830292862769, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9194, |
|
"eval_samples_per_second": 16.465, |
|
"eval_steps_per_second": 2.236, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8071778099281224, |
|
"precision": 0.80572410140167, |
|
"recall": 0.8174925373134329, |
|
"support": 33500.0 |
|
}, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_Claim": { |
|
"f1-score": 0.5993816254416962, |
|
"precision": 0.6593780369290574, |
|
"recall": 0.5493927125506073, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8017817371937639, |
|
"precision": 0.7197382769901853, |
|
"recall": 0.9049360146252285, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9058997050147494, |
|
"precision": 0.9337184554575859, |
|
"recall": 0.8796906330564308, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8854737486606459, |
|
"precision": 0.862579028987236, |
|
"recall": 0.9096169570413234, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8468358208955223, |
|
"eval_loss": 0.4562840759754181, |
|
"eval_macro avg": { |
|
"f1-score": 0.7981342040777137, |
|
"precision": 0.7938534495910161, |
|
"recall": 0.8109090793183975, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.904, |
|
"eval_samples_per_second": 16.517, |
|
"eval_steps_per_second": 2.243, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8442053257085675, |
|
"precision": 0.8455251408465503, |
|
"recall": 0.8468358208955223, |
|
"support": 33500.0 |
|
}, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6235462150581514, |
|
"precision": 0.6285479226655697, |
|
"recall": 0.6186234817813765, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8338848444738584, |
|
"precision": 0.8059701492537313, |
|
"recall": 0.8638025594149908, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9066250826953974, |
|
"precision": 0.8974646833193002, |
|
"recall": 0.9159744103886184, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8827730692315017, |
|
"precision": 0.8911176621379133, |
|
"recall": 0.8745833071262343, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8490746268656716, |
|
"eval_loss": 0.43820467591285706, |
|
"eval_macro avg": { |
|
"f1-score": 0.8117073028647273, |
|
"precision": 0.8057751043441286, |
|
"recall": 0.818245939677805, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9179, |
|
"eval_samples_per_second": 16.47, |
|
"eval_steps_per_second": 2.237, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8488105033097496, |
|
"precision": 0.8488213959184715, |
|
"recall": 0.8490746268656716, |
|
"support": 33500.0 |
|
}, |
|
"step": 243 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6415287144900879, |
|
"precision": 0.6477507222451506, |
|
"recall": 0.6354251012145749, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8005126014523707, |
|
"precision": 0.7514033680834001, |
|
"recall": 0.856489945155393, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9065169636319258, |
|
"precision": 0.9273871354374751, |
|
"recall": 0.8865654540246348, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8932505382719131, |
|
"precision": 0.8863636363636364, |
|
"recall": 0.9002452984464432, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8540597014925373, |
|
"eval_loss": 0.4749625325202942, |
|
"eval_macro avg": { |
|
"f1-score": 0.8104522044615743, |
|
"precision": 0.8032262155324155, |
|
"recall": 0.8196814497102615, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.8972, |
|
"eval_samples_per_second": 16.54, |
|
"eval_steps_per_second": 2.246, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8542213698406307, |
|
"precision": 0.8551874645146165, |
|
"recall": 0.8540597014925373, |
|
"support": 33500.0 |
|
}, |
|
"step": 324 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6099687080911935, |
|
"precision": 0.6808882235528942, |
|
"recall": 0.5524291497975709, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8315018315018317, |
|
"precision": 0.8330275229357799, |
|
"recall": 0.829981718464351, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9103454839630722, |
|
"precision": 0.9074091642159188, |
|
"recall": 0.9133008689009835, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8913988368533824, |
|
"precision": 0.8682249120505635, |
|
"recall": 0.915843763758727, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8558507462686568, |
|
"eval_loss": 0.5162495374679565, |
|
"eval_macro avg": { |
|
"f1-score": 0.8108037151023699, |
|
"precision": 0.8223874556887891, |
|
"recall": 0.8028888752304081, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9413, |
|
"eval_samples_per_second": 16.392, |
|
"eval_steps_per_second": 2.226, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8519095458499607, |
|
"precision": 0.8505509283002989, |
|
"recall": 0.8558507462686568, |
|
"support": 33500.0 |
|
}, |
|
"step": 405 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_Claim": { |
|
"f1-score": 0.646279703934554, |
|
"precision": 0.6227477477477478, |
|
"recall": 0.6716599190283401, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8414067684140676, |
|
"precision": 0.8152593227603944, |
|
"recall": 0.8692870201096892, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9112506693929215, |
|
"precision": 0.9295788637266588, |
|
"recall": 0.8936312422419556, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8861383012314494, |
|
"precision": 0.8897343224906474, |
|
"recall": 0.8825712308950249, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8540597014925373, |
|
"eval_loss": 0.552895724773407, |
|
"eval_macro avg": { |
|
"f1-score": 0.8212688607432481, |
|
"precision": 0.8143300641813621, |
|
"recall": 0.8292873530687525, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9336, |
|
"eval_samples_per_second": 16.418, |
|
"eval_steps_per_second": 2.23, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8556973390614198, |
|
"precision": 0.8579560210496036, |
|
"recall": 0.8540597014925373, |
|
"support": 33500.0 |
|
}, |
|
"step": 486 |
|
}, |
|
{ |
|
"epoch": 6.17, |
|
"grad_norm": 9.790245056152344, |
|
"learning_rate": 1.7530864197530865e-05, |
|
"loss": 0.3328, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6202600808654791, |
|
"precision": 0.6739491807171694, |
|
"recall": 0.5744939271255061, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8670041417395307, |
|
"precision": 0.8730305838739574, |
|
"recall": 0.8610603290676416, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9109892729439809, |
|
"precision": 0.9097314797181489, |
|
"recall": 0.9122505490308412, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8872356123954747, |
|
"precision": 0.8677611401767996, |
|
"recall": 0.9076042518397384, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8568955223880597, |
|
"eval_loss": 0.5894299149513245, |
|
"eval_macro avg": { |
|
"f1-score": 0.8213722769861164, |
|
"precision": 0.8311180961215189, |
|
"recall": 0.8138522642659318, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9037, |
|
"eval_samples_per_second": 16.518, |
|
"eval_steps_per_second": 2.243, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8539713289140156, |
|
"precision": 0.8526463291050193, |
|
"recall": 0.8568955223880597, |
|
"support": 33500.0 |
|
}, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6441500279902966, |
|
"precision": 0.5974385600553825, |
|
"recall": 0.6987854251012146, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.834510811389424, |
|
"precision": 0.7849375755134917, |
|
"recall": 0.8907678244972578, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9059161060546101, |
|
"precision": 0.9398542543364466, |
|
"recall": 0.874343550081161, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8801401497053671, |
|
"precision": 0.8915849251419721, |
|
"recall": 0.8689854707843261, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8469850746268657, |
|
"eval_loss": 0.5878348350524902, |
|
"eval_macro avg": { |
|
"f1-score": 0.8161792737849245, |
|
"precision": 0.8034538287618231, |
|
"recall": 0.8332205676159898, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.9086, |
|
"eval_samples_per_second": 16.502, |
|
"eval_steps_per_second": 2.241, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8504184600736624, |
|
"precision": 0.8563340964894008, |
|
"recall": 0.8469850746268657, |
|
"support": 33500.0 |
|
}, |
|
"step": 648 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6323094193285029, |
|
"precision": 0.6375797489195307, |
|
"recall": 0.6271255060728745, |
|
"support": 4940.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8525914292124747, |
|
"precision": 0.8373732921992068, |
|
"recall": 0.8683729433272395, |
|
"support": 2188.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9054132151801194, |
|
"precision": 0.9134194927606647, |
|
"recall": 0.8975460708488494, |
|
"support": 10473.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8888055034396498, |
|
"precision": 0.883775884584292, |
|
"recall": 0.8938926976539405, |
|
"support": 15899.0 |
|
}, |
|
"eval_accuracy": 0.8540298507462687, |
|
"eval_loss": 0.7043101191520691, |
|
"eval_macro avg": { |
|
"f1-score": 0.8197798917901866, |
|
"precision": 0.8180371046159236, |
|
"recall": 0.821734304475726, |
|
"support": 33500.0 |
|
}, |
|
"eval_runtime": 4.935, |
|
"eval_samples_per_second": 16.414, |
|
"eval_steps_per_second": 2.229, |
|
"eval_weighted avg": { |
|
"f1-score": 0.853808653145316, |
|
"precision": 0.8537078167069386, |
|
"recall": 0.8540298507462687, |
|
"support": 33500.0 |
|
}, |
|
"step": 729 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4050, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 1290079654806600.0, |
|
"train_batch_size": 4, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|