{ "epoch": 0.010905601116733554, "eval_accuracy": 0.7869404549281535, "eval_loss": 0.8759388327598572, "eval_runtime": 249.4157, "eval_samples": 5564, "eval_samples_per_second": 22.308, "eval_steps_per_second": 0.088, "perplexity": 2.4011284942034856, "total_flos": 1.3069163715939533e+18, "train_loss": 1.3858390502929687, "train_runtime": 13072.5982, "train_samples": 5868487, "train_samples_per_second": 1346.745, "train_steps_per_second": 21.043 }