Qwen3-0.6B-sft-4chan / all_results.json
wassname's picture
End of training
408be0d verified
{
"base_eval_samples": 10000,
"epoch": 3.0,
"eval_loss": 2.3705878257751465,
"eval_model_preparation_time": 0.0052,
"eval_runtime": 439.9764,
"eval_samples": 18272,
"eval_samples_per_second": 22.728,
"eval_steps_per_second": 1.421,
"total_flos": 6.89082454341845e+17,
"train_loss": 0.0,
"train_runtime": 1.3308,
"train_samples": 74558,
"train_samples_per_second": 95664.35,
"train_steps_per_second": 374.2
}