{ "total_flos": 1.5047606448160768e+16, "train_loss": 0.3481092903137207, "train_runtime": 972.7733, "train_samples": 5000, "train_samples_per_second": 5.14, "train_steps_per_second": 0.642 }