{
  "epoch": 9.321127579192096,
  "eval_accuracy": 0.3345458864628659,
  "eval_loss": 3.945629119873047,
  "eval_runtime": 233.188,
  "eval_samples": 33767,
  "eval_samples_per_second": 144.806,
  "eval_steps_per_second": 1.51,
  "perplexity": 51.70885895206038,
  "total_flos": 5.363892569191219e+17,
  "train_loss": 4.763968430426513,
  "train_runtime": 93599.1484,
  "train_samples": 660643,
  "train_samples_per_second": 705.822,
  "train_steps_per_second": 7.353
}