{ "best_metric": 0.9884615384615384, "best_model_checkpoint": "./results/checkpoint-30", "epoch": 1.0, "eval_steps": 5, "global_step": 38, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "eval_accuracy": 0.43902439024390244, "eval_f1": 0.7958371594735232, "eval_loss": 0.8333200216293335, "eval_precision": 0.43807919123841615, "eval_recall": 1.0, "eval_roc_auc": 0.5014947683109118, "eval_runtime": 52.2016, "eval_samples_per_second": 22.777, "eval_steps_per_second": 0.364, "step": 0 }, { "epoch": 0.13157894736842105, "grad_norm": 499350.4375, "learning_rate": 2.5e-05, "loss": 0.7332, "step": 5 }, { "epoch": 0.13157894736842105, "eval_accuracy": 0.6181665264928511, "eval_f1": 0.1537744641192917, "eval_loss": 0.6050995588302612, "eval_precision": 1.0, "eval_recall": 0.12692307692307692, "eval_roc_auc": 0.5634615384615385, "eval_runtime": 52.7835, "eval_samples_per_second": 22.526, "eval_steps_per_second": 0.36, "step": 5 }, { "epoch": 0.2631578947368421, "grad_norm": 544000.625, "learning_rate": 5e-05, "loss": 0.5445, "step": 10 }, { "epoch": 0.2631578947368421, "eval_accuracy": 0.8275862068965517, "eval_f1": 0.9246697607997144, "eval_loss": 0.3963133990764618, "eval_precision": 0.7184466019417476, "eval_recall": 0.9961538461538462, "eval_roc_auc": 0.8463579395193745, "eval_runtime": 51.9808, "eval_samples_per_second": 22.874, "eval_steps_per_second": 0.366, "step": 10 }, { "epoch": 0.39473684210526316, "grad_norm": 215321.078125, "learning_rate": 4.107142857142857e-05, "loss": 0.328, "step": 15 }, { "epoch": 0.39473684210526316, "eval_accuracy": 0.928511354079058, "eval_f1": 0.9660574412532638, "eval_loss": 0.2025815099477768, "eval_precision": 0.8618968386023295, "eval_recall": 0.9961538461538462, "eval_roc_auc": 0.9360440381740831, "eval_runtime": 52.187, "eval_samples_per_second": 22.783, "eval_steps_per_second": 0.364, "step": 15 }, { "epoch": 0.5263157894736842, "grad_norm": 447920.53125, "learning_rate": 3.2142857142857144e-05, "loss": 0.2165, "step": 20 }, { "epoch": 0.5263157894736842, "eval_accuracy": 0.9865433137089992, "eval_f1": 0.9799382716049382, "eval_loss": 0.061642639338970184, "eval_precision": 0.9921875, "eval_recall": 0.9769230769230769, "eval_roc_auc": 0.9854720018397148, "eval_runtime": 51.8127, "eval_samples_per_second": 22.948, "eval_steps_per_second": 0.367, "step": 20 }, { "epoch": 0.6578947368421053, "grad_norm": 41190.76953125, "learning_rate": 2.3214285714285715e-05, "loss": 0.0754, "step": 25 }, { "epoch": 0.6578947368421053, "eval_accuracy": 0.9806560134566863, "eval_f1": 0.9854573287409109, "eval_loss": 0.050207946449518204, "eval_precision": 0.9662288930581614, "eval_recall": 0.9903846153846154, "eval_roc_auc": 0.9817393928941014, "eval_runtime": 51.4902, "eval_samples_per_second": 23.092, "eval_steps_per_second": 0.369, "step": 25 }, { "epoch": 0.7894736842105263, "grad_norm": 14033.9931640625, "learning_rate": 1.4285714285714285e-05, "loss": 0.022, "step": 30 }, { "epoch": 0.7894736842105263, "eval_accuracy": 0.9899074852817493, "eval_f1": 0.9884615384615384, "eval_loss": 0.03608058765530586, "eval_precision": 0.9884615384615385, "eval_recall": 0.9884615384615385, "eval_roc_auc": 0.9897464642980338, "eval_runtime": 51.3673, "eval_samples_per_second": 23.147, "eval_steps_per_second": 0.37, "step": 30 }, { "epoch": 0.9210526315789473, "grad_norm": 249264.84375, "learning_rate": 5.357142857142857e-06, "loss": 0.1406, "step": 35 }, { "epoch": 0.9210526315789473, "eval_accuracy": 0.9915895710681245, "eval_f1": 0.9880585516178735, "eval_loss": 0.031022196635603905, "eval_precision": 0.9941860465116279, "eval_recall": 0.9865384615384616, "eval_roc_auc": 0.9910270783028631, "eval_runtime": 50.7403, "eval_samples_per_second": 23.433, "eval_steps_per_second": 0.374, "step": 35 } ], "logging_steps": 5, "max_steps": 38, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 150, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 8.0526013794091e+16, "train_batch_size": 32, "trial_name": null, "trial_params": null }