gpt2-larger-walser / all_results.json
Jonas
walser larger commit
01c3411
{
"epoch": 5.0,
"eval_accuracy": 0.27604251159501675,
"eval_loss": 4.173768997192383,
"eval_runtime": 4.8911,
"eval_samples": 235,
"eval_samples_per_second": 48.047,
"eval_steps_per_second": 6.134,
"perplexity": 64.9598246952154,
"train_loss": 4.937346829501065,
"train_runtime": 481.6631,
"train_samples": 1755,
"train_samples_per_second": 18.218,
"train_steps_per_second": 1.142
}