{ "best_global_step": 2632, "best_metric": 0.4779825967353135, "best_model_checkpoint": "./segment-base-freezed-results-6969/checkpoint-2632", "epoch": 7.0, "eval_steps": 500, "global_step": 2632, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.8237275449101796, "eval_f1": 0.3313072949886817, "eval_loss": 0.5073999762535095, "eval_precision": 0.5454317269076305, "eval_recall": 0.34907830204633855, "eval_runtime": 4.5501, "eval_samples_per_second": 587.239, "eval_steps_per_second": 9.231, "step": 376 }, { "epoch": 1.3297872340425532, "grad_norm": 0.5485729575157166, "learning_rate": 9.98e-05, "loss": 0.5835, "step": 500 }, { "epoch": 2.0, "eval_accuracy": 0.8304640718562875, "eval_f1": 0.39590410126027326, "eval_loss": 0.482469379901886, "eval_precision": 0.6605972418855854, "eval_recall": 0.38597765077906376, "eval_runtime": 4.5616, "eval_samples_per_second": 585.765, "eval_steps_per_second": 9.207, "step": 752 }, { "epoch": 2.6595744680851063, "grad_norm": 0.6865694522857666, "learning_rate": 9.727322404371585e-05, "loss": 0.4701, "step": 1000 }, { "epoch": 3.0, "eval_accuracy": 0.8383233532934131, "eval_f1": 0.46028878960226666, "eval_loss": 0.46620744466781616, "eval_precision": 0.6894544615241363, "eval_recall": 0.4443744036963646, "eval_runtime": 4.561, "eval_samples_per_second": 585.832, "eval_steps_per_second": 9.208, "step": 1128 }, { "epoch": 3.9893617021276597, "grad_norm": 0.7495972514152527, "learning_rate": 9.454098360655738e-05, "loss": 0.4695, "step": 1500 }, { "epoch": 4.0, "eval_accuracy": 0.8409431137724551, "eval_f1": 0.4762458332322515, "eval_loss": 0.4532054364681244, "eval_precision": 0.6477548490754955, "eval_recall": 0.45254045291953454, "eval_runtime": 4.555, "eval_samples_per_second": 586.614, "eval_steps_per_second": 9.221, "step": 1504 }, { "epoch": 5.0, "eval_accuracy": 0.8390718562874252, "eval_f1": 0.47448273231679866, "eval_loss": 0.4566827714443207, "eval_precision": 0.63084183828443, "eval_recall": 0.4594250276812524, "eval_runtime": 4.5703, "eval_samples_per_second": 584.641, "eval_steps_per_second": 9.19, "step": 1880 }, { "epoch": 5.319148936170213, "grad_norm": 0.6681276559829712, "learning_rate": 9.180874316939892e-05, "loss": 0.4604, "step": 2000 }, { "epoch": 6.0, "eval_accuracy": 0.8413173652694611, "eval_f1": 0.4747950596602187, "eval_loss": 0.45092836022377014, "eval_precision": 0.6538129274551482, "eval_recall": 0.4443024483948064, "eval_runtime": 4.5601, "eval_samples_per_second": 585.954, "eval_steps_per_second": 9.21, "step": 2256 }, { "epoch": 6.648936170212766, "grad_norm": 0.5326411128044128, "learning_rate": 8.907650273224044e-05, "loss": 0.4577, "step": 2500 }, { "epoch": 7.0, "eval_accuracy": 0.8413173652694611, "eval_f1": 0.4779825967353135, "eval_loss": 0.449787437915802, "eval_precision": 0.6573432134465932, "eval_recall": 0.4501210955075003, "eval_runtime": 4.5584, "eval_samples_per_second": 586.176, "eval_steps_per_second": 9.214, "step": 2632 } ], "logging_steps": 500, "max_steps": 18800, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 5, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 5534590741908480.0, "train_batch_size": 64, "trial_name": null, "trial_params": null }