{ | |
"epoch": 3.0, | |
"eval_loss": 2.435030460357666, | |
"eval_runtime": 2.5197, | |
"eval_samples": 2500, | |
"eval_samples_per_second": 992.173, | |
"eval_steps_per_second": 124.22, | |
"num_input_tokens_seen": 55653732, | |
"total_flos": 1.4738832163602432e+16, | |
"train_loss": 1.7073542784139526, | |
"train_runtime": 2504.3889, | |
"train_samples": 248732, | |
"train_samples_per_second": 297.955, | |
"train_steps_per_second": 37.245, | |
"train_tokens_per_second": 22216.164 | |
} |