{
  "epoch": 3.0,
  "eval_loss": 0.9653898477554321,
  "eval_runtime": 372.5365,
  "eval_samples": 27783,
  "eval_samples_per_second": 74.578,
  "eval_steps_per_second": 9.323,
  "perplexity": 2.625811123536144,
  "total_flos": 9.222180154174341e+17,
  "train_loss": 0.22489413543016407,
  "train_runtime": 25369.8446,
  "train_samples": 500096,
  "train_samples_per_second": 59.137,
  "train_steps_per_second": 0.924
}