SmolLM2-360M-sft / all_results.json
wassname's picture
End of training
f0a6d5f verified
raw
history blame
449 Bytes
{
"epoch": 3.0,
"eval_loss": 1.4015671014785767,
"eval_model_preparation_time": 0.0049,
"eval_runtime": 340.7516,
"eval_samples": 13188,
"eval_samples_per_second": 38.703,
"eval_steps_per_second": 2.421,
"total_flos": 7.533943292711404e+17,
"train_loss": 1.4212341141200129,
"train_runtime": 13229.3679,
"train_samples": 117772,
"train_samples_per_second": 14.73,
"train_steps_per_second": 0.058
}