{ "best_metric": 1.6099027395248413, "best_model_checkpoint": "gemstones_image_detection/checkpoint-4779", "epoch": 59.0, "eval_steps": 500, "global_step": 4779, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.06521739130434782, "eval_loss": 4.402697563171387, "eval_runtime": 7.0526, "eval_samples_per_second": 91.314, "eval_steps_per_second": 11.485, "step": 81 }, { "epoch": 2.0, "eval_accuracy": 0.2329192546583851, "eval_loss": 4.283246994018555, "eval_runtime": 6.9117, "eval_samples_per_second": 93.176, "eval_steps_per_second": 11.719, "step": 162 }, { "epoch": 3.0, "eval_accuracy": 0.38354037267080743, "eval_loss": 4.158541202545166, "eval_runtime": 7.0269, "eval_samples_per_second": 91.648, "eval_steps_per_second": 11.527, "step": 243 }, { "epoch": 4.0, "eval_accuracy": 0.5139751552795031, "eval_loss": 4.027233123779297, "eval_runtime": 6.9926, "eval_samples_per_second": 92.098, "eval_steps_per_second": 11.584, "step": 324 }, { "epoch": 5.0, "eval_accuracy": 0.6024844720496895, "eval_loss": 3.892688035964966, "eval_runtime": 7.1602, "eval_samples_per_second": 89.942, "eval_steps_per_second": 11.313, "step": 405 }, { "epoch": 6.0, "eval_accuracy": 0.65527950310559, "eval_loss": 3.7535414695739746, "eval_runtime": 7.0085, "eval_samples_per_second": 91.888, "eval_steps_per_second": 11.557, "step": 486 }, { "epoch": 6.17, "learning_rate": 9.064449064449066e-06, "loss": 4.0521, "step": 500 }, { "epoch": 7.0, "eval_accuracy": 0.6816770186335404, "eval_loss": 3.6245224475860596, "eval_runtime": 6.9342, "eval_samples_per_second": 92.873, "eval_steps_per_second": 11.681, "step": 567 }, { "epoch": 8.0, "eval_accuracy": 0.7065217391304348, "eval_loss": 3.5059802532196045, "eval_runtime": 6.9825, "eval_samples_per_second": 92.231, "eval_steps_per_second": 11.6, "step": 648 }, { "epoch": 9.0, "eval_accuracy": 0.7251552795031055, "eval_loss": 3.3893799781799316, "eval_runtime": 7.0313, "eval_samples_per_second": 91.59, "eval_steps_per_second": 11.52, "step": 729 }, { "epoch": 10.0, "eval_accuracy": 0.7468944099378882, "eval_loss": 3.2792539596557617, "eval_runtime": 6.9072, "eval_samples_per_second": 93.236, "eval_steps_per_second": 11.727, "step": 810 }, { "epoch": 11.0, "eval_accuracy": 0.7593167701863354, "eval_loss": 3.185778856277466, "eval_runtime": 7.1843, "eval_samples_per_second": 89.64, "eval_steps_per_second": 11.275, "step": 891 }, { "epoch": 12.0, "eval_accuracy": 0.765527950310559, "eval_loss": 3.093205690383911, "eval_runtime": 7.203, "eval_samples_per_second": 89.407, "eval_steps_per_second": 11.245, "step": 972 }, { "epoch": 12.35, "learning_rate": 8.024948024948025e-06, "loss": 3.1602, "step": 1000 }, { "epoch": 13.0, "eval_accuracy": 0.7639751552795031, "eval_loss": 3.006822347640991, "eval_runtime": 6.9935, "eval_samples_per_second": 92.086, "eval_steps_per_second": 11.582, "step": 1053 }, { "epoch": 14.0, "eval_accuracy": 0.7701863354037267, "eval_loss": 2.9287173748016357, "eval_runtime": 6.8243, "eval_samples_per_second": 94.369, "eval_steps_per_second": 11.869, "step": 1134 }, { "epoch": 15.0, "eval_accuracy": 0.7763975155279503, "eval_loss": 2.8492088317871094, "eval_runtime": 6.9345, "eval_samples_per_second": 92.869, "eval_steps_per_second": 11.681, "step": 1215 }, { "epoch": 16.0, "eval_accuracy": 0.7763975155279503, "eval_loss": 2.779766082763672, "eval_runtime": 7.4706, "eval_samples_per_second": 86.204, "eval_steps_per_second": 10.842, "step": 1296 }, { "epoch": 17.0, "eval_accuracy": 0.782608695652174, "eval_loss": 2.71138858795166, "eval_runtime": 7.6693, "eval_samples_per_second": 83.971, "eval_steps_per_second": 10.562, "step": 1377 }, { "epoch": 18.0, "eval_accuracy": 0.7857142857142857, "eval_loss": 2.64682674407959, "eval_runtime": 7.4341, "eval_samples_per_second": 86.628, "eval_steps_per_second": 10.896, "step": 1458 }, { "epoch": 18.52, "learning_rate": 6.985446985446987e-06, "loss": 2.537, "step": 1500 }, { "epoch": 19.0, "eval_accuracy": 0.7841614906832298, "eval_loss": 2.586892604827881, "eval_runtime": 7.0064, "eval_samples_per_second": 91.916, "eval_steps_per_second": 11.561, "step": 1539 }, { "epoch": 20.0, "eval_accuracy": 0.7888198757763976, "eval_loss": 2.533936023712158, "eval_runtime": 6.9165, "eval_samples_per_second": 93.111, "eval_steps_per_second": 11.711, "step": 1620 }, { "epoch": 21.0, "eval_accuracy": 0.7950310559006211, "eval_loss": 2.4751620292663574, "eval_runtime": 6.8444, "eval_samples_per_second": 94.092, "eval_steps_per_second": 11.835, "step": 1701 }, { "epoch": 22.0, "eval_accuracy": 0.8059006211180124, "eval_loss": 2.4239892959594727, "eval_runtime": 6.7886, "eval_samples_per_second": 94.864, "eval_steps_per_second": 11.932, "step": 1782 }, { "epoch": 23.0, "eval_accuracy": 0.8027950310559007, "eval_loss": 2.3724544048309326, "eval_runtime": 6.8741, "eval_samples_per_second": 93.685, "eval_steps_per_second": 11.783, "step": 1863 }, { "epoch": 24.0, "eval_accuracy": 0.8043478260869565, "eval_loss": 2.327075719833374, "eval_runtime": 7.4527, "eval_samples_per_second": 86.412, "eval_steps_per_second": 10.869, "step": 1944 }, { "epoch": 24.69, "learning_rate": 5.945945945945947e-06, "loss": 2.0899, "step": 2000 }, { "epoch": 25.0, "eval_accuracy": 0.8074534161490683, "eval_loss": 2.2822916507720947, "eval_runtime": 6.923, "eval_samples_per_second": 93.024, "eval_steps_per_second": 11.7, "step": 2025 }, { "epoch": 26.0, "eval_accuracy": 0.812111801242236, "eval_loss": 2.2414402961730957, "eval_runtime": 6.7582, "eval_samples_per_second": 95.292, "eval_steps_per_second": 11.985, "step": 2106 }, { "epoch": 27.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 2.198101043701172, "eval_runtime": 6.9757, "eval_samples_per_second": 92.32, "eval_steps_per_second": 11.612, "step": 2187 }, { "epoch": 28.0, "eval_accuracy": 0.812111801242236, "eval_loss": 2.158327579498291, "eval_runtime": 6.8707, "eval_samples_per_second": 93.732, "eval_steps_per_second": 11.789, "step": 2268 }, { "epoch": 29.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 2.1208977699279785, "eval_runtime": 7.0622, "eval_samples_per_second": 91.19, "eval_steps_per_second": 11.47, "step": 2349 }, { "epoch": 30.0, "eval_accuracy": 0.8198757763975155, "eval_loss": 2.086048126220703, "eval_runtime": 7.4205, "eval_samples_per_second": 86.787, "eval_steps_per_second": 10.916, "step": 2430 }, { "epoch": 30.86, "learning_rate": 4.906444906444907e-06, "loss": 1.7517, "step": 2500 }, { "epoch": 31.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 2.054029941558838, "eval_runtime": 7.2868, "eval_samples_per_second": 88.38, "eval_steps_per_second": 11.116, "step": 2511 }, { "epoch": 32.0, "eval_accuracy": 0.8214285714285714, "eval_loss": 2.0214383602142334, "eval_runtime": 6.9044, "eval_samples_per_second": 93.273, "eval_steps_per_second": 11.732, "step": 2592 }, { "epoch": 33.0, "eval_accuracy": 0.8245341614906833, "eval_loss": 1.9886717796325684, "eval_runtime": 7.0403, "eval_samples_per_second": 91.474, "eval_steps_per_second": 11.505, "step": 2673 }, { "epoch": 34.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.9592698812484741, "eval_runtime": 7.0078, "eval_samples_per_second": 91.898, "eval_steps_per_second": 11.559, "step": 2754 }, { "epoch": 35.0, "eval_accuracy": 0.8136645962732919, "eval_loss": 1.9315446615219116, "eval_runtime": 6.9305, "eval_samples_per_second": 92.922, "eval_steps_per_second": 11.687, "step": 2835 }, { "epoch": 36.0, "eval_accuracy": 0.8136645962732919, "eval_loss": 1.903202772140503, "eval_runtime": 7.1188, "eval_samples_per_second": 90.464, "eval_steps_per_second": 11.378, "step": 2916 }, { "epoch": 37.0, "eval_accuracy": 0.8214285714285714, "eval_loss": 1.8818532228469849, "eval_runtime": 7.3502, "eval_samples_per_second": 87.617, "eval_steps_per_second": 11.02, "step": 2997 }, { "epoch": 37.04, "learning_rate": 3.866943866943867e-06, "loss": 1.4983, "step": 3000 }, { "epoch": 38.0, "eval_accuracy": 0.8198757763975155, "eval_loss": 1.85394287109375, "eval_runtime": 7.066, "eval_samples_per_second": 91.141, "eval_steps_per_second": 11.463, "step": 3078 }, { "epoch": 39.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 1.8299955129623413, "eval_runtime": 6.9274, "eval_samples_per_second": 92.965, "eval_steps_per_second": 11.693, "step": 3159 }, { "epoch": 40.0, "eval_accuracy": 0.8198757763975155, "eval_loss": 1.811854362487793, "eval_runtime": 6.9595, "eval_samples_per_second": 92.536, "eval_steps_per_second": 11.639, "step": 3240 }, { "epoch": 41.0, "eval_accuracy": 0.8136645962732919, "eval_loss": 1.7893236875534058, "eval_runtime": 6.921, "eval_samples_per_second": 93.05, "eval_steps_per_second": 11.704, "step": 3321 }, { "epoch": 42.0, "eval_accuracy": 0.8214285714285714, "eval_loss": 1.7720342874526978, "eval_runtime": 6.8638, "eval_samples_per_second": 93.826, "eval_steps_per_second": 11.801, "step": 3402 }, { "epoch": 43.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.7533122301101685, "eval_runtime": 7.194, "eval_samples_per_second": 89.519, "eval_steps_per_second": 11.259, "step": 3483 }, { "epoch": 43.21, "learning_rate": 2.827442827442828e-06, "loss": 1.3099, "step": 3500 }, { "epoch": 44.0, "eval_accuracy": 0.8214285714285714, "eval_loss": 1.7392221689224243, "eval_runtime": 6.9012, "eval_samples_per_second": 93.317, "eval_steps_per_second": 11.737, "step": 3564 }, { "epoch": 45.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.71939218044281, "eval_runtime": 7.3602, "eval_samples_per_second": 87.497, "eval_steps_per_second": 11.005, "step": 3645 }, { "epoch": 46.0, "eval_accuracy": 0.8183229813664596, "eval_loss": 1.7061350345611572, "eval_runtime": 7.1127, "eval_samples_per_second": 90.542, "eval_steps_per_second": 11.388, "step": 3726 }, { "epoch": 47.0, "eval_accuracy": 0.8198757763975155, "eval_loss": 1.6922202110290527, "eval_runtime": 7.1567, "eval_samples_per_second": 89.986, "eval_steps_per_second": 11.318, "step": 3807 }, { "epoch": 48.0, "eval_accuracy": 0.8136645962732919, "eval_loss": 1.6803785562515259, "eval_runtime": 6.8048, "eval_samples_per_second": 94.64, "eval_steps_per_second": 11.903, "step": 3888 }, { "epoch": 49.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 1.6694267988204956, "eval_runtime": 7.2998, "eval_samples_per_second": 88.221, "eval_steps_per_second": 11.096, "step": 3969 }, { "epoch": 49.38, "learning_rate": 1.7879417879417881e-06, "loss": 1.1777, "step": 4000 }, { "epoch": 50.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.6600834131240845, "eval_runtime": 6.8099, "eval_samples_per_second": 94.568, "eval_steps_per_second": 11.894, "step": 4050 }, { "epoch": 51.0, "eval_accuracy": 0.8214285714285714, "eval_loss": 1.6486986875534058, "eval_runtime": 6.809, "eval_samples_per_second": 94.581, "eval_steps_per_second": 11.896, "step": 4131 }, { "epoch": 52.0, "eval_accuracy": 0.8152173913043478, "eval_loss": 1.641870379447937, "eval_runtime": 6.9774, "eval_samples_per_second": 92.297, "eval_steps_per_second": 11.609, "step": 4212 }, { "epoch": 53.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.6351778507232666, "eval_runtime": 7.0388, "eval_samples_per_second": 91.493, "eval_steps_per_second": 11.508, "step": 4293 }, { "epoch": 54.0, "eval_accuracy": 0.812111801242236, "eval_loss": 1.6281042098999023, "eval_runtime": 7.0002, "eval_samples_per_second": 91.997, "eval_steps_per_second": 11.571, "step": 4374 }, { "epoch": 55.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.6229327917099, "eval_runtime": 7.1102, "eval_samples_per_second": 90.574, "eval_steps_per_second": 11.392, "step": 4455 }, { "epoch": 55.56, "learning_rate": 7.484407484407485e-07, "loss": 1.0992, "step": 4500 }, { "epoch": 56.0, "eval_accuracy": 0.8136645962732919, "eval_loss": 1.6176931858062744, "eval_runtime": 6.9832, "eval_samples_per_second": 92.221, "eval_steps_per_second": 11.599, "step": 4536 }, { "epoch": 57.0, "eval_accuracy": 0.8183229813664596, "eval_loss": 1.6147724390029907, "eval_runtime": 6.8902, "eval_samples_per_second": 93.465, "eval_steps_per_second": 11.756, "step": 4617 }, { "epoch": 58.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.6121727228164673, "eval_runtime": 6.9785, "eval_samples_per_second": 92.283, "eval_steps_per_second": 11.607, "step": 4698 }, { "epoch": 59.0, "eval_accuracy": 0.8167701863354038, "eval_loss": 1.6099027395248413, "eval_runtime": 7.0345, "eval_samples_per_second": 91.548, "eval_steps_per_second": 11.515, "step": 4779 } ], "logging_steps": 500, "max_steps": 4860, "num_train_epochs": 60, "save_steps": 500, "total_flos": 1.1781939502129306e+19, "trial_name": null, "trial_params": null }