{ "epoch": 3.0, "num_input_tokens_seen": 55653732, "total_flos": 1.4738832163602432e+16, "train_loss": 1.7073542784139526, "train_runtime": 2504.3889, "train_samples": 248732, "train_samples_per_second": 297.955, "train_steps_per_second": 37.245, "train_tokens_per_second": 22216.164 }