{ "epoch": 3.0, "eval_loss": 0.9653898477554321, "eval_runtime": 372.5365, "eval_samples": 27783, "eval_samples_per_second": 74.578, "eval_steps_per_second": 9.323, "perplexity": 2.625811123536144, "total_flos": 9.222180154174341e+17, "train_loss": 0.22489413543016407, "train_runtime": 25369.8446, "train_samples": 500096, "train_samples_per_second": 59.137, "train_steps_per_second": 0.924 }