{ "epoch": 9.321127579192096, "eval_accuracy": 0.3345458864628659, "eval_loss": 3.945629119873047, "eval_runtime": 233.188, "eval_samples": 33767, "eval_samples_per_second": 144.806, "eval_steps_per_second": 1.51, "perplexity": 51.70885895206038, "total_flos": 5.363892569191219e+17, "train_loss": 4.763968430426513, "train_runtime": 93599.1484, "train_samples": 660643, "train_samples_per_second": 705.822, "train_steps_per_second": 7.353 }