longformer-spans / checkpoint-243 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 3, checkpoint
5df034f verified
raw
history blame
3.87 kB
{
"best_metric": 0.2252955436706543,
"best_model_checkpoint": "longformer-spans/checkpoint-162",
"epoch": 3.0,
"eval_steps": 500,
"global_step": 243,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B": {
"f1-score": 0.816,
"precision": 0.7461594732991953,
"recall": 0.9002647837599294,
"support": 1133.0
},
"eval_I": {
"f1-score": 0.9321376763813793,
"precision": 0.9024103768767235,
"recall": 0.9638902525500463,
"support": 18333.0
},
"eval_O": {
"f1-score": 0.8560784528570645,
"precision": 0.931782945736434,
"recall": 0.7917511147142278,
"support": 9868.0
},
"eval_accuracy": 0.9035249198881844,
"eval_loss": 0.2619660496711731,
"eval_macro avg": {
"f1-score": 0.8680720430794812,
"precision": 0.860117598637451,
"recall": 0.8853020503414012,
"support": 29334.0
},
"eval_runtime": 5.5032,
"eval_samples_per_second": 14.537,
"eval_steps_per_second": 1.817,
"eval_weighted avg": {
"f1-score": 0.9020655278480035,
"precision": 0.9062562975065145,
"recall": 0.9035249198881844,
"support": 29334.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_B": {
"f1-score": 0.8512256973795435,
"precision": 0.8167072181670721,
"recall": 0.8887908208296558,
"support": 1133.0
},
"eval_I": {
"f1-score": 0.9416781438711729,
"precision": 0.9152551099212274,
"recall": 0.9696721758577429,
"support": 18333.0
},
"eval_O": {
"f1-score": 0.8778173190984578,
"precision": 0.9380041484212952,
"recall": 0.8248885285772193,
"support": 9868.0
},
"eval_accuracy": 0.9178427763005387,
"eval_loss": 0.2252955436706543,
"eval_macro avg": {
"f1-score": 0.8902403867830581,
"precision": 0.8899888255031981,
"recall": 0.8944505084215394,
"support": 29334.0
},
"eval_runtime": 5.4972,
"eval_samples_per_second": 14.553,
"eval_steps_per_second": 1.819,
"eval_weighted avg": {
"f1-score": 0.9167016237671239,
"precision": 0.9191015935430046,
"recall": 0.9178427763005387,
"support": 29334.0
},
"step": 162
},
{
"epoch": 3.0,
"eval_B": {
"f1-score": 0.8531120331950207,
"precision": 0.8050117462803446,
"recall": 0.9073256840247131,
"support": 1133.0
},
"eval_I": {
"f1-score": 0.9469915571230095,
"precision": 0.9280963603037444,
"recall": 0.9666721213112965,
"support": 18333.0
},
"eval_O": {
"f1-score": 0.8903876792352629,
"precision": 0.9353938852934612,
"recall": 0.8495135792460479,
"support": 9868.0
},
"eval_accuracy": 0.9249676143724006,
"eval_loss": 0.22786012291908264,
"eval_macro avg": {
"f1-score": 0.8968304231844311,
"precision": 0.8895006639591835,
"recall": 0.9078371281940192,
"support": 29334.0
},
"eval_runtime": 5.5036,
"eval_samples_per_second": 14.536,
"eval_steps_per_second": 1.817,
"eval_weighted avg": {
"f1-score": 0.9243239165827936,
"precision": 0.9257972230878861,
"recall": 0.9249676143724006,
"support": 29334.0
},
"step": 243
}
],
"logging_steps": 500,
"max_steps": 1620,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 431359958206800.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}