epoch = 5.0 train_loss = 1.4089593235308369 train_runtime = 87255.1901 train_samples_per_second = 1665.125 train_steps_per_second = 13.009