{
  "epoch": 3.0,
  "eval_loss": 1.0790187120437622,
  "eval_runtime": 300.3896,
  "eval_samples": 22063,
  "eval_samples_per_second": 73.448,
  "eval_steps_per_second": 9.181,
  "perplexity": 2.941791389777784,
  "total_flos": 4.61198337106772e+17,
  "train_loss": 1.3434544682004388,
  "train_runtime": 53992.4682,
  "train_samples": 250048,
  "train_samples_per_second": 13.893,
  "train_steps_per_second": 0.217
}