{ "best_metric": 0.39216598868370056, "best_model_checkpoint": "/scratch/hlv8980/Attack_Benchmark/models/hyena/tf4/origin/checkpoint-600", "epoch": 4.0, "global_step": 1188, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.34, "learning_rate": 2.8760984182776802e-05, "loss": 0.5992, "step": 100 }, { "epoch": 0.67, "learning_rate": 2.615114235500879e-05, "loss": 0.4813, "step": 200 }, { "epoch": 0.67, "eval_accuracy": 0.774, "eval_f1": 0.7713328260834371, "eval_loss": 0.48207539319992065, "eval_matthews_correlation": 0.5579338694412199, "eval_precision": 0.785067107786007, "eval_recall": 0.772997299729973, "eval_runtime": 0.1057, "eval_samples_per_second": 9462.679, "eval_steps_per_second": 151.403, "step": 200 }, { "epoch": 1.01, "learning_rate": 2.3514938488576452e-05, "loss": 0.4431, "step": 300 }, { "epoch": 1.35, "learning_rate": 2.087873462214411e-05, "loss": 0.377, "step": 400 }, { "epoch": 1.35, "eval_accuracy": 0.816, "eval_f1": 0.8159933757615274, "eval_loss": 0.427643358707428, "eval_matthews_correlation": 0.6320128653971173, "eval_precision": 0.815991263965056, "eval_recall": 0.816021602160216, "eval_runtime": 0.1039, "eval_samples_per_second": 9625.637, "eval_steps_per_second": 154.01, "step": 400 }, { "epoch": 1.68, "learning_rate": 1.82688927943761e-05, "loss": 0.3443, "step": 500 }, { "epoch": 2.02, "learning_rate": 1.563268892794376e-05, "loss": 0.33, "step": 600 }, { "epoch": 2.02, "eval_accuracy": 0.824, "eval_f1": 0.8239746523499383, "eval_loss": 0.39216598868370056, "eval_matthews_correlation": 0.6479558982194922, "eval_precision": 0.8239935027265344, "eval_recall": 0.8239623962396239, "eval_runtime": 0.1031, "eval_samples_per_second": 9696.512, "eval_steps_per_second": 155.144, "step": 600 }, { "epoch": 2.36, "learning_rate": 1.2996485061511423e-05, "loss": 0.227, "step": 700 }, { "epoch": 2.69, "learning_rate": 1.0360281195079087e-05, "loss": 0.2219, "step": 800 }, { "epoch": 2.69, "eval_accuracy": 0.838, "eval_f1": 0.8379766686402841, "eval_loss": 0.4026987850666046, "eval_matthews_correlation": 0.6767651028795362, "eval_precision": 0.8385613769517563, "eval_recall": 0.8382038203820381, "eval_runtime": 0.1026, "eval_samples_per_second": 9746.534, "eval_steps_per_second": 155.945, "step": 800 }, { "epoch": 3.03, "learning_rate": 7.724077328646749e-06, "loss": 0.2121, "step": 900 }, { "epoch": 3.37, "learning_rate": 5.087873462214412e-06, "loss": 0.1388, "step": 1000 }, { "epoch": 3.37, "eval_accuracy": 0.857, "eval_f1": 0.8566558306493891, "eval_loss": 0.393052339553833, "eval_matthews_correlation": 0.7159331394438886, "eval_precision": 0.859342750257998, "eval_recall": 0.8565956595659566, "eval_runtime": 0.1036, "eval_samples_per_second": 9656.574, "eval_steps_per_second": 154.505, "step": 1000 }, { "epoch": 3.7, "learning_rate": 2.4516695957820737e-06, "loss": 0.1394, "step": 1100 }, { "epoch": 4.0, "step": 1188, "total_flos": 152279543808000.0, "train_loss": 0.30630172623528373, "train_runtime": 38.7189, "train_samples_per_second": 1962.866, "train_steps_per_second": 30.683 } ], "max_steps": 1188, "num_train_epochs": 4, "total_flos": 152279543808000.0, "trial_name": null, "trial_params": null }