{ "best_metric": 0.6532846715328468, "best_model_checkpoint": "./outputs/en_es_multilingual/mdeberta-v3-base-output/met_xnli_test_en_8_0.01_0.00005_11-17-23_09-47/checkpoint-3630", "epoch": 4.0, "global_step": 7260, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 3.989595545134818e-05, "loss": 0.0887, "step": 1815 }, { "epoch": 1.0, "eval_accuracy": 0.9858611825192802, "eval_f1": 0.6258389261744967, "eval_loss": 0.04259440675377846, "eval_precision": 0.6109746109746109, "eval_recall": 0.641444539982803, "eval_runtime": 14.5185, "eval_samples_per_second": 334.951, "eval_steps_per_second": 41.877, "step": 1815 }, { "epoch": 2.0, "learning_rate": 2.6597303634232123e-05, "loss": 0.0228, "step": 3630 }, { "epoch": 2.0, "eval_accuracy": 0.9879240851820115, "eval_f1": 0.6532846715328468, "eval_loss": 0.034684374928474426, "eval_precision": 0.6958211856171039, "eval_recall": 0.6156491831470335, "eval_runtime": 13.7183, "eval_samples_per_second": 354.489, "eval_steps_per_second": 44.32, "step": 3630 }, { "epoch": 3.0, "learning_rate": 1.3298651817116062e-05, "loss": 0.0104, "step": 5445 }, { "epoch": 3.0, "eval_accuracy": 0.9885270874988099, "eval_f1": 0.6226415094339622, "eval_loss": 0.05654400959610939, "eval_precision": 0.7973154362416107, "eval_recall": 0.5107480653482374, "eval_runtime": 12.5259, "eval_samples_per_second": 388.237, "eval_steps_per_second": 48.54, "step": 5445 }, { "epoch": 4.0, "learning_rate": 0.0, "loss": 0.0046, "step": 7260 }, { "epoch": 4.0, "eval_accuracy": 0.9881779808943476, "eval_f1": 0.6463007159904535, "eval_loss": 0.05788963660597801, "eval_precision": 0.7263948497854077, "eval_recall": 0.5821152192605331, "eval_runtime": 13.3972, "eval_samples_per_second": 362.986, "eval_steps_per_second": 45.383, "step": 7260 }, { "epoch": 4.0, "step": 7260, "total_flos": 1062049033953072.0, "train_loss": 0.031637020347532165, "train_runtime": 972.4399, "train_samples_per_second": 59.722, "train_steps_per_second": 7.466 } ], "max_steps": 7260, "num_train_epochs": 4, "total_flos": 1062049033953072.0, "trial_name": null, "trial_params": null }