{ "epoch": 0.9996830427892235, "eval_loss": 0.25049829483032227, "eval_runtime": 874.704, "eval_samples": 4000, "eval_samples_per_second": 4.573, "eval_steps_per_second": 0.572, "total_flos": 8013042675351552.0, "train_loss": 0.3010184336819827, "train_runtime": 18281.3669, "train_samples": 25239, "train_samples_per_second": 1.381, "train_steps_per_second": 0.086 }