|
{ |
|
"best_metric": 0.5993899703025818, |
|
"best_model_checkpoint": "output_pipe/H3K4me2/origin/checkpoint-600", |
|
"epoch": 4.0, |
|
"eval_steps": 200, |
|
"global_step": 1536, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.2604166666666667, |
|
"grad_norm": 1.312898874282837, |
|
"learning_rate": 2.8990578734858683e-05, |
|
"loss": 0.6687, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.5208333333333334, |
|
"grad_norm": 2.9508161544799805, |
|
"learning_rate": 2.6971736204576044e-05, |
|
"loss": 0.6281, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.5208333333333334, |
|
"eval_accuracy": 0.6285434995112414, |
|
"eval_f1": 0.5024471908501684, |
|
"eval_loss": 0.6490753889083862, |
|
"eval_matthews_correlation": 0.2086399181537894, |
|
"eval_precision": 0.6864785107900588, |
|
"eval_recall": 0.5583587557391902, |
|
"eval_runtime": 1.8488, |
|
"eval_samples_per_second": 1660.0, |
|
"eval_steps_per_second": 25.963, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.78125, |
|
"grad_norm": 0.962492048740387, |
|
"learning_rate": 2.4952893674293406e-05, |
|
"loss": 0.6215, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.0416666666666667, |
|
"grad_norm": 2.185643196105957, |
|
"learning_rate": 2.293405114401077e-05, |
|
"loss": 0.6117, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.0416666666666667, |
|
"eval_accuracy": 0.6614532420984034, |
|
"eval_f1": 0.6577790055568811, |
|
"eval_loss": 0.610870361328125, |
|
"eval_matthews_correlation": 0.3219078238538063, |
|
"eval_precision": 0.6586412781887111, |
|
"eval_recall": 0.6633002586738914, |
|
"eval_runtime": 1.8461, |
|
"eval_samples_per_second": 1662.442, |
|
"eval_steps_per_second": 26.001, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.3020833333333333, |
|
"grad_norm": 1.5712463855743408, |
|
"learning_rate": 2.091520861372813e-05, |
|
"loss": 0.5579, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.5625, |
|
"grad_norm": 1.733756422996521, |
|
"learning_rate": 1.8896366083445493e-05, |
|
"loss": 0.5406, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.5625, |
|
"eval_accuracy": 0.6656891495601173, |
|
"eval_f1": 0.6606768458059544, |
|
"eval_loss": 0.5993899703025818, |
|
"eval_matthews_correlation": 0.32485375836499847, |
|
"eval_precision": 0.6603972055360026, |
|
"eval_recall": 0.6644822364130554, |
|
"eval_runtime": 1.8474, |
|
"eval_samples_per_second": 1661.26, |
|
"eval_steps_per_second": 25.983, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.8229166666666665, |
|
"grad_norm": 1.8414597511291504, |
|
"learning_rate": 1.6877523553162854e-05, |
|
"loss": 0.5476, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.0833333333333335, |
|
"grad_norm": 3.3911778926849365, |
|
"learning_rate": 1.4858681022880215e-05, |
|
"loss": 0.4847, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.0833333333333335, |
|
"eval_accuracy": 0.6764418377321603, |
|
"eval_f1": 0.6664955835944539, |
|
"eval_loss": 0.6927724480628967, |
|
"eval_matthews_correlation": 0.33299131530494724, |
|
"eval_precision": 0.6665149724192277, |
|
"eval_recall": 0.66647634512612, |
|
"eval_runtime": 1.8456, |
|
"eval_samples_per_second": 1662.868, |
|
"eval_steps_per_second": 26.008, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.34375, |
|
"grad_norm": 4.598505973815918, |
|
"learning_rate": 1.2839838492597578e-05, |
|
"loss": 0.3215, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.6041666666666665, |
|
"grad_norm": 6.187351226806641, |
|
"learning_rate": 1.082099596231494e-05, |
|
"loss": 0.2986, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.6041666666666665, |
|
"eval_accuracy": 0.6722059302704464, |
|
"eval_f1": 0.6665124930330224, |
|
"eval_loss": 0.7655965089797974, |
|
"eval_matthews_correlation": 0.3354089433290383, |
|
"eval_precision": 0.665851832445941, |
|
"eval_recall": 0.6695778056925763, |
|
"eval_runtime": 1.8471, |
|
"eval_samples_per_second": 1661.506, |
|
"eval_steps_per_second": 25.986, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.8645833333333335, |
|
"grad_norm": 6.935540199279785, |
|
"learning_rate": 8.8021534320323e-06, |
|
"loss": 0.2776, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.125, |
|
"grad_norm": 3.6287009716033936, |
|
"learning_rate": 6.7833109017496635e-06, |
|
"loss": 0.165, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.125, |
|
"eval_accuracy": 0.6715542521994134, |
|
"eval_f1": 0.6602836723667622, |
|
"eval_loss": 1.1591715812683105, |
|
"eval_matthews_correlation": 0.3207000488328631, |
|
"eval_precision": 0.660941771459814, |
|
"eval_recall": 0.659760453095114, |
|
"eval_runtime": 1.8438, |
|
"eval_samples_per_second": 1664.518, |
|
"eval_steps_per_second": 26.034, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.3854166666666665, |
|
"grad_norm": 3.4551613330841064, |
|
"learning_rate": 4.764468371467026e-06, |
|
"loss": 0.0605, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.6458333333333335, |
|
"grad_norm": 1.9309793710708618, |
|
"learning_rate": 2.7456258411843877e-06, |
|
"loss": 0.0536, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.6458333333333335, |
|
"eval_accuracy": 0.6614532420984034, |
|
"eval_f1": 0.6480922910837987, |
|
"eval_loss": 1.3020259141921997, |
|
"eval_matthews_correlation": 0.2968783195103293, |
|
"eval_precision": 0.6497979913241463, |
|
"eval_recall": 0.6470926542742468, |
|
"eval_runtime": 1.8472, |
|
"eval_samples_per_second": 1661.427, |
|
"eval_steps_per_second": 25.985, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.90625, |
|
"grad_norm": 6.031075954437256, |
|
"learning_rate": 7.267833109017497e-07, |
|
"loss": 0.0562, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"step": 1536, |
|
"total_flos": 2.50013189805102e+16, |
|
"train_loss": 0.38483377111454803, |
|
"train_runtime": 235.9383, |
|
"train_samples_per_second": 416.126, |
|
"train_steps_per_second": 6.51 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 1536, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 4, |
|
"save_steps": 200, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 2.50013189805102e+16, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|