{ "epoch": 3.0, "eval_loss": 1.0790187120437622, "eval_runtime": 300.3896, "eval_samples": 22063, "eval_samples_per_second": 73.448, "eval_steps_per_second": 9.181, "perplexity": 2.941791389777784, "total_flos": 4.61198337106772e+17, "train_loss": 1.3434544682004388, "train_runtime": 53992.4682, "train_samples": 250048, "train_samples_per_second": 13.893, "train_steps_per_second": 0.217 }