Chenghao-Qiu's picture
Upload folder using huggingface_hub
2927dac verified
{
"best_metric": 0.5993899703025818,
"best_model_checkpoint": "output_pipe/H3K4me2/origin/checkpoint-600",
"epoch": 4.0,
"eval_steps": 200,
"global_step": 1536,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.2604166666666667,
"grad_norm": 1.312898874282837,
"learning_rate": 2.8990578734858683e-05,
"loss": 0.6687,
"step": 100
},
{
"epoch": 0.5208333333333334,
"grad_norm": 2.9508161544799805,
"learning_rate": 2.6971736204576044e-05,
"loss": 0.6281,
"step": 200
},
{
"epoch": 0.5208333333333334,
"eval_accuracy": 0.6285434995112414,
"eval_f1": 0.5024471908501684,
"eval_loss": 0.6490753889083862,
"eval_matthews_correlation": 0.2086399181537894,
"eval_precision": 0.6864785107900588,
"eval_recall": 0.5583587557391902,
"eval_runtime": 1.8488,
"eval_samples_per_second": 1660.0,
"eval_steps_per_second": 25.963,
"step": 200
},
{
"epoch": 0.78125,
"grad_norm": 0.962492048740387,
"learning_rate": 2.4952893674293406e-05,
"loss": 0.6215,
"step": 300
},
{
"epoch": 1.0416666666666667,
"grad_norm": 2.185643196105957,
"learning_rate": 2.293405114401077e-05,
"loss": 0.6117,
"step": 400
},
{
"epoch": 1.0416666666666667,
"eval_accuracy": 0.6614532420984034,
"eval_f1": 0.6577790055568811,
"eval_loss": 0.610870361328125,
"eval_matthews_correlation": 0.3219078238538063,
"eval_precision": 0.6586412781887111,
"eval_recall": 0.6633002586738914,
"eval_runtime": 1.8461,
"eval_samples_per_second": 1662.442,
"eval_steps_per_second": 26.001,
"step": 400
},
{
"epoch": 1.3020833333333333,
"grad_norm": 1.5712463855743408,
"learning_rate": 2.091520861372813e-05,
"loss": 0.5579,
"step": 500
},
{
"epoch": 1.5625,
"grad_norm": 1.733756422996521,
"learning_rate": 1.8896366083445493e-05,
"loss": 0.5406,
"step": 600
},
{
"epoch": 1.5625,
"eval_accuracy": 0.6656891495601173,
"eval_f1": 0.6606768458059544,
"eval_loss": 0.5993899703025818,
"eval_matthews_correlation": 0.32485375836499847,
"eval_precision": 0.6603972055360026,
"eval_recall": 0.6644822364130554,
"eval_runtime": 1.8474,
"eval_samples_per_second": 1661.26,
"eval_steps_per_second": 25.983,
"step": 600
},
{
"epoch": 1.8229166666666665,
"grad_norm": 1.8414597511291504,
"learning_rate": 1.6877523553162854e-05,
"loss": 0.5476,
"step": 700
},
{
"epoch": 2.0833333333333335,
"grad_norm": 3.3911778926849365,
"learning_rate": 1.4858681022880215e-05,
"loss": 0.4847,
"step": 800
},
{
"epoch": 2.0833333333333335,
"eval_accuracy": 0.6764418377321603,
"eval_f1": 0.6664955835944539,
"eval_loss": 0.6927724480628967,
"eval_matthews_correlation": 0.33299131530494724,
"eval_precision": 0.6665149724192277,
"eval_recall": 0.66647634512612,
"eval_runtime": 1.8456,
"eval_samples_per_second": 1662.868,
"eval_steps_per_second": 26.008,
"step": 800
},
{
"epoch": 2.34375,
"grad_norm": 4.598505973815918,
"learning_rate": 1.2839838492597578e-05,
"loss": 0.3215,
"step": 900
},
{
"epoch": 2.6041666666666665,
"grad_norm": 6.187351226806641,
"learning_rate": 1.082099596231494e-05,
"loss": 0.2986,
"step": 1000
},
{
"epoch": 2.6041666666666665,
"eval_accuracy": 0.6722059302704464,
"eval_f1": 0.6665124930330224,
"eval_loss": 0.7655965089797974,
"eval_matthews_correlation": 0.3354089433290383,
"eval_precision": 0.665851832445941,
"eval_recall": 0.6695778056925763,
"eval_runtime": 1.8471,
"eval_samples_per_second": 1661.506,
"eval_steps_per_second": 25.986,
"step": 1000
},
{
"epoch": 2.8645833333333335,
"grad_norm": 6.935540199279785,
"learning_rate": 8.8021534320323e-06,
"loss": 0.2776,
"step": 1100
},
{
"epoch": 3.125,
"grad_norm": 3.6287009716033936,
"learning_rate": 6.7833109017496635e-06,
"loss": 0.165,
"step": 1200
},
{
"epoch": 3.125,
"eval_accuracy": 0.6715542521994134,
"eval_f1": 0.6602836723667622,
"eval_loss": 1.1591715812683105,
"eval_matthews_correlation": 0.3207000488328631,
"eval_precision": 0.660941771459814,
"eval_recall": 0.659760453095114,
"eval_runtime": 1.8438,
"eval_samples_per_second": 1664.518,
"eval_steps_per_second": 26.034,
"step": 1200
},
{
"epoch": 3.3854166666666665,
"grad_norm": 3.4551613330841064,
"learning_rate": 4.764468371467026e-06,
"loss": 0.0605,
"step": 1300
},
{
"epoch": 3.6458333333333335,
"grad_norm": 1.9309793710708618,
"learning_rate": 2.7456258411843877e-06,
"loss": 0.0536,
"step": 1400
},
{
"epoch": 3.6458333333333335,
"eval_accuracy": 0.6614532420984034,
"eval_f1": 0.6480922910837987,
"eval_loss": 1.3020259141921997,
"eval_matthews_correlation": 0.2968783195103293,
"eval_precision": 0.6497979913241463,
"eval_recall": 0.6470926542742468,
"eval_runtime": 1.8472,
"eval_samples_per_second": 1661.427,
"eval_steps_per_second": 25.985,
"step": 1400
},
{
"epoch": 3.90625,
"grad_norm": 6.031075954437256,
"learning_rate": 7.267833109017497e-07,
"loss": 0.0562,
"step": 1500
},
{
"epoch": 4.0,
"step": 1536,
"total_flos": 2.50013189805102e+16,
"train_loss": 0.38483377111454803,
"train_runtime": 235.9383,
"train_samples_per_second": 416.126,
"train_steps_per_second": 6.51
}
],
"logging_steps": 100,
"max_steps": 1536,
"num_input_tokens_seen": 0,
"num_train_epochs": 4,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 2.50013189805102e+16,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}