{ "best_metric": 0.8408180526634443, "best_model_checkpoint": "/chronos_data/smangalik/beliefs_modeling/models/self-belief-classifier-roberta-large-4/checkpoint-400", "epoch": 11.926605504587156, "eval_steps": 50, "global_step": 650, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.92, "learning_rate": 9.800000000000001e-06, "loss": 0.6617, "step": 50 }, { "epoch": 0.92, "eval_accuracy": 0.8205128205128205, "eval_f1": 0.819110295968641, "eval_loss": 0.4295506179332733, "eval_precision": 0.8192280280764046, "eval_recall": 0.8205128205128205, "eval_runtime": 3.9576, "eval_samples_per_second": 128.108, "eval_steps_per_second": 16.171, "step": 50 }, { "epoch": 1.83, "learning_rate": 9.815094339622643e-06, "loss": 0.3715, "step": 100 }, { "epoch": 1.83, "eval_accuracy": 0.8303747534516766, "eval_f1": 0.8353461502742431, "eval_loss": 0.4670024514198303, "eval_precision": 0.8434047624966725, "eval_recall": 0.8303747534516766, "eval_runtime": 3.9366, "eval_samples_per_second": 128.79, "eval_steps_per_second": 16.258, "step": 100 }, { "epoch": 2.75, "learning_rate": 9.626415094339624e-06, "loss": 0.2344, "step": 150 }, { "epoch": 2.75, "eval_accuracy": 0.814595660749507, "eval_f1": 0.8244485345966336, "eval_loss": 0.6940962672233582, "eval_precision": 0.8428588493485568, "eval_recall": 0.814595660749507, "eval_runtime": 3.4428, "eval_samples_per_second": 147.263, "eval_steps_per_second": 18.589, "step": 150 }, { "epoch": 3.67, "learning_rate": 9.437735849056604e-06, "loss": 0.1797, "step": 200 }, { "epoch": 3.67, "eval_accuracy": 0.8264299802761341, "eval_f1": 0.8329637103282812, "eval_loss": 0.7602464556694031, "eval_precision": 0.8480073311662002, "eval_recall": 0.8264299802761341, "eval_runtime": 3.5906, "eval_samples_per_second": 141.203, "eval_steps_per_second": 17.824, "step": 200 }, { "epoch": 4.59, "learning_rate": 9.252830188679246e-06, "loss": 0.1187, "step": 250 }, { "epoch": 4.59, "eval_accuracy": 0.8165680473372781, "eval_f1": 0.8260410505358732, "eval_loss": 1.040390133857727, "eval_precision": 0.8445598652695405, "eval_recall": 0.8165680473372781, "eval_runtime": 3.1667, "eval_samples_per_second": 160.104, "eval_steps_per_second": 20.21, "step": 250 }, { "epoch": 5.5, "learning_rate": 9.067924528301889e-06, "loss": 0.067, "step": 300 }, { "epoch": 5.5, "eval_accuracy": 0.8264299802761341, "eval_f1": 0.8313863456050801, "eval_loss": 1.0527454614639282, "eval_precision": 0.8389317220188415, "eval_recall": 0.8264299802761341, "eval_runtime": 4.2619, "eval_samples_per_second": 118.962, "eval_steps_per_second": 15.017, "step": 300 }, { "epoch": 6.42, "learning_rate": 8.879245283018869e-06, "loss": 0.0635, "step": 350 }, { "epoch": 6.42, "eval_accuracy": 0.8303747534516766, "eval_f1": 0.8376041385770543, "eval_loss": 1.1337926387786865, "eval_precision": 0.8504492855502807, "eval_recall": 0.8303747534516766, "eval_runtime": 4.0094, "eval_samples_per_second": 126.454, "eval_steps_per_second": 15.963, "step": 350 }, { "epoch": 7.34, "learning_rate": 8.69433962264151e-06, "loss": 0.0254, "step": 400 }, { "epoch": 7.34, "eval_accuracy": 0.8382642998027613, "eval_f1": 0.8408180526634443, "eval_loss": 1.1419103145599365, "eval_precision": 0.8458355761491414, "eval_recall": 0.8382642998027613, "eval_runtime": 3.6866, "eval_samples_per_second": 137.524, "eval_steps_per_second": 17.36, "step": 400 }, { "epoch": 8.26, "learning_rate": 8.505660377358492e-06, "loss": 0.0374, "step": 450 }, { "epoch": 8.26, "eval_accuracy": 0.8284023668639053, "eval_f1": 0.8320464737199128, "eval_loss": 1.2373206615447998, "eval_precision": 0.8369363588201497, "eval_recall": 0.8284023668639053, "eval_runtime": 4.0231, "eval_samples_per_second": 126.021, "eval_steps_per_second": 15.908, "step": 450 }, { "epoch": 9.17, "learning_rate": 8.316981132075472e-06, "loss": 0.013, "step": 500 }, { "epoch": 9.17, "eval_accuracy": 0.834319526627219, "eval_f1": 0.8376685641339108, "eval_loss": 1.2268174886703491, "eval_precision": 0.8421800999981714, "eval_recall": 0.834319526627219, "eval_runtime": 4.1413, "eval_samples_per_second": 122.425, "eval_steps_per_second": 15.454, "step": 500 }, { "epoch": 10.09, "learning_rate": 8.128301886792453e-06, "loss": 0.0213, "step": 550 }, { "epoch": 10.09, "eval_accuracy": 0.834319526627219, "eval_f1": 0.8396773850135992, "eval_loss": 1.2791889905929565, "eval_precision": 0.8499112935552067, "eval_recall": 0.834319526627219, "eval_runtime": 4.1859, "eval_samples_per_second": 121.122, "eval_steps_per_second": 15.29, "step": 550 }, { "epoch": 11.01, "learning_rate": 7.939622641509435e-06, "loss": 0.0003, "step": 600 }, { "epoch": 11.01, "eval_accuracy": 0.8303747534516766, "eval_f1": 0.8359161169722349, "eval_loss": 1.3518141508102417, "eval_precision": 0.8446374502780472, "eval_recall": 0.8303747534516766, "eval_runtime": 3.09, "eval_samples_per_second": 164.08, "eval_steps_per_second": 20.712, "step": 600 }, { "epoch": 11.93, "learning_rate": 7.750943396226415e-06, "loss": 0.0313, "step": 650 }, { "epoch": 11.93, "eval_accuracy": 0.8382642998027613, "eval_f1": 0.8405182086840655, "eval_loss": 1.3090877532958984, "eval_precision": 0.8442165138341221, "eval_recall": 0.8382642998027613, "eval_runtime": 4.7065, "eval_samples_per_second": 107.722, "eval_steps_per_second": 13.598, "step": 650 } ], "logging_steps": 50, "max_steps": 2700, "num_train_epochs": 50, "save_steps": 50, "total_flos": 2261979798655680.0, "trial_name": null, "trial_params": null }