|
{ |
|
"best_metric": 0.8408180526634443, |
|
"best_model_checkpoint": "/chronos_data/smangalik/beliefs_modeling/models/self-belief-classifier-roberta-large-4/checkpoint-400", |
|
"epoch": 11.926605504587156, |
|
"eval_steps": 50, |
|
"global_step": 650, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.92, |
|
"learning_rate": 9.800000000000001e-06, |
|
"loss": 0.6617, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"eval_accuracy": 0.8205128205128205, |
|
"eval_f1": 0.819110295968641, |
|
"eval_loss": 0.4295506179332733, |
|
"eval_precision": 0.8192280280764046, |
|
"eval_recall": 0.8205128205128205, |
|
"eval_runtime": 3.9576, |
|
"eval_samples_per_second": 128.108, |
|
"eval_steps_per_second": 16.171, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"learning_rate": 9.815094339622643e-06, |
|
"loss": 0.3715, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_accuracy": 0.8303747534516766, |
|
"eval_f1": 0.8353461502742431, |
|
"eval_loss": 0.4670024514198303, |
|
"eval_precision": 0.8434047624966725, |
|
"eval_recall": 0.8303747534516766, |
|
"eval_runtime": 3.9366, |
|
"eval_samples_per_second": 128.79, |
|
"eval_steps_per_second": 16.258, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.75, |
|
"learning_rate": 9.626415094339624e-06, |
|
"loss": 0.2344, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 2.75, |
|
"eval_accuracy": 0.814595660749507, |
|
"eval_f1": 0.8244485345966336, |
|
"eval_loss": 0.6940962672233582, |
|
"eval_precision": 0.8428588493485568, |
|
"eval_recall": 0.814595660749507, |
|
"eval_runtime": 3.4428, |
|
"eval_samples_per_second": 147.263, |
|
"eval_steps_per_second": 18.589, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"learning_rate": 9.437735849056604e-06, |
|
"loss": 0.1797, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"eval_accuracy": 0.8264299802761341, |
|
"eval_f1": 0.8329637103282812, |
|
"eval_loss": 0.7602464556694031, |
|
"eval_precision": 0.8480073311662002, |
|
"eval_recall": 0.8264299802761341, |
|
"eval_runtime": 3.5906, |
|
"eval_samples_per_second": 141.203, |
|
"eval_steps_per_second": 17.824, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"learning_rate": 9.252830188679246e-06, |
|
"loss": 0.1187, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"eval_accuracy": 0.8165680473372781, |
|
"eval_f1": 0.8260410505358732, |
|
"eval_loss": 1.040390133857727, |
|
"eval_precision": 0.8445598652695405, |
|
"eval_recall": 0.8165680473372781, |
|
"eval_runtime": 3.1667, |
|
"eval_samples_per_second": 160.104, |
|
"eval_steps_per_second": 20.21, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"learning_rate": 9.067924528301889e-06, |
|
"loss": 0.067, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"eval_accuracy": 0.8264299802761341, |
|
"eval_f1": 0.8313863456050801, |
|
"eval_loss": 1.0527454614639282, |
|
"eval_precision": 0.8389317220188415, |
|
"eval_recall": 0.8264299802761341, |
|
"eval_runtime": 4.2619, |
|
"eval_samples_per_second": 118.962, |
|
"eval_steps_per_second": 15.017, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"learning_rate": 8.879245283018869e-06, |
|
"loss": 0.0635, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"eval_accuracy": 0.8303747534516766, |
|
"eval_f1": 0.8376041385770543, |
|
"eval_loss": 1.1337926387786865, |
|
"eval_precision": 0.8504492855502807, |
|
"eval_recall": 0.8303747534516766, |
|
"eval_runtime": 4.0094, |
|
"eval_samples_per_second": 126.454, |
|
"eval_steps_per_second": 15.963, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"learning_rate": 8.69433962264151e-06, |
|
"loss": 0.0254, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"eval_accuracy": 0.8382642998027613, |
|
"eval_f1": 0.8408180526634443, |
|
"eval_loss": 1.1419103145599365, |
|
"eval_precision": 0.8458355761491414, |
|
"eval_recall": 0.8382642998027613, |
|
"eval_runtime": 3.6866, |
|
"eval_samples_per_second": 137.524, |
|
"eval_steps_per_second": 17.36, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 8.26, |
|
"learning_rate": 8.505660377358492e-06, |
|
"loss": 0.0374, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 8.26, |
|
"eval_accuracy": 0.8284023668639053, |
|
"eval_f1": 0.8320464737199128, |
|
"eval_loss": 1.2373206615447998, |
|
"eval_precision": 0.8369363588201497, |
|
"eval_recall": 0.8284023668639053, |
|
"eval_runtime": 4.0231, |
|
"eval_samples_per_second": 126.021, |
|
"eval_steps_per_second": 15.908, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"learning_rate": 8.316981132075472e-06, |
|
"loss": 0.013, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"eval_accuracy": 0.834319526627219, |
|
"eval_f1": 0.8376685641339108, |
|
"eval_loss": 1.2268174886703491, |
|
"eval_precision": 0.8421800999981714, |
|
"eval_recall": 0.834319526627219, |
|
"eval_runtime": 4.1413, |
|
"eval_samples_per_second": 122.425, |
|
"eval_steps_per_second": 15.454, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 10.09, |
|
"learning_rate": 8.128301886792453e-06, |
|
"loss": 0.0213, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 10.09, |
|
"eval_accuracy": 0.834319526627219, |
|
"eval_f1": 0.8396773850135992, |
|
"eval_loss": 1.2791889905929565, |
|
"eval_precision": 0.8499112935552067, |
|
"eval_recall": 0.834319526627219, |
|
"eval_runtime": 4.1859, |
|
"eval_samples_per_second": 121.122, |
|
"eval_steps_per_second": 15.29, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"learning_rate": 7.939622641509435e-06, |
|
"loss": 0.0003, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"eval_accuracy": 0.8303747534516766, |
|
"eval_f1": 0.8359161169722349, |
|
"eval_loss": 1.3518141508102417, |
|
"eval_precision": 0.8446374502780472, |
|
"eval_recall": 0.8303747534516766, |
|
"eval_runtime": 3.09, |
|
"eval_samples_per_second": 164.08, |
|
"eval_steps_per_second": 20.712, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 11.93, |
|
"learning_rate": 7.750943396226415e-06, |
|
"loss": 0.0313, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 11.93, |
|
"eval_accuracy": 0.8382642998027613, |
|
"eval_f1": 0.8405182086840655, |
|
"eval_loss": 1.3090877532958984, |
|
"eval_precision": 0.8442165138341221, |
|
"eval_recall": 0.8382642998027613, |
|
"eval_runtime": 4.7065, |
|
"eval_samples_per_second": 107.722, |
|
"eval_steps_per_second": 13.598, |
|
"step": 650 |
|
} |
|
], |
|
"logging_steps": 50, |
|
"max_steps": 2700, |
|
"num_train_epochs": 50, |
|
"save_steps": 50, |
|
"total_flos": 2261979798655680.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|