chessgpt2-medium-m / all_results.json
dakwi's picture
End of training
9d03e12 verified
raw
history blame contribute delete
445 Bytes
{
"epoch": 3.0,
"eval_loss": 0.9653898477554321,
"eval_runtime": 372.5365,
"eval_samples": 27783,
"eval_samples_per_second": 74.578,
"eval_steps_per_second": 9.323,
"perplexity": 2.625811123536144,
"total_flos": 9.222180154174341e+17,
"train_loss": 0.22489413543016407,
"train_runtime": 25369.8446,
"train_samples": 500096,
"train_samples_per_second": 59.137,
"train_steps_per_second": 0.924
}