hubert_arabic_mdd / trainer_state.json
nrshoudi's picture
End of training
016bb93
{
"best_metric": 0.3309297263622284,
"best_model_checkpoint": "nrshoudi/hubert_arabic_mdd/checkpoint-11459",
"epoch": 20.0,
"eval_steps": 500,
"global_step": 32740,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 5e-05,
"loss": 5.6351,
"step": 1637
},
{
"epoch": 1.0,
"eval_loss": 0.7704485058784485,
"eval_per": 0.3110336379911429,
"eval_runtime": 117.9251,
"eval_samples_per_second": 6.894,
"eval_steps_per_second": 3.451,
"eval_wer": 0.3277028603424945,
"step": 1637
},
{
"epoch": 2.0,
"learning_rate": 0.0001,
"loss": 0.3646,
"step": 3274
},
{
"epoch": 2.0,
"eval_loss": 0.433285653591156,
"eval_per": 0.05403750117780081,
"eval_runtime": 117.5906,
"eval_samples_per_second": 6.914,
"eval_steps_per_second": 3.461,
"eval_wer": 0.06728570761980308,
"step": 3274
},
{
"epoch": 3.0,
"learning_rate": 9.444444444444444e-05,
"loss": 0.1587,
"step": 4911
},
{
"epoch": 3.0,
"eval_loss": 0.3875606060028076,
"eval_per": 0.05804202393291247,
"eval_runtime": 117.765,
"eval_samples_per_second": 6.904,
"eval_steps_per_second": 3.456,
"eval_wer": 0.07101861788997246,
"step": 4911
},
{
"epoch": 4.0,
"learning_rate": 8.888888888888889e-05,
"loss": 0.1105,
"step": 6548
},
{
"epoch": 4.0,
"eval_loss": 0.3607988655567169,
"eval_per": 0.05578064637708471,
"eval_runtime": 117.9127,
"eval_samples_per_second": 6.895,
"eval_steps_per_second": 3.452,
"eval_wer": 0.06695907797116327,
"step": 6548
},
{
"epoch": 5.0,
"learning_rate": 8.333333333333334e-05,
"loss": 0.0878,
"step": 8185
},
{
"epoch": 5.0,
"eval_loss": 0.3808358907699585,
"eval_per": 0.05618109865259587,
"eval_runtime": 117.5542,
"eval_samples_per_second": 6.916,
"eval_steps_per_second": 3.462,
"eval_wer": 0.06775232140357426,
"step": 8185
},
{
"epoch": 6.0,
"learning_rate": 7.777777777777778e-05,
"loss": 0.0738,
"step": 9822
},
{
"epoch": 6.0,
"eval_loss": 0.3576147258281708,
"eval_per": 0.05177612362197305,
"eval_runtime": 118.5636,
"eval_samples_per_second": 6.857,
"eval_steps_per_second": 3.433,
"eval_wer": 0.06392608837665065,
"step": 9822
},
{
"epoch": 7.0,
"learning_rate": 7.222222222222222e-05,
"loss": 0.0594,
"step": 11459
},
{
"epoch": 7.0,
"eval_loss": 0.3309297263622284,
"eval_per": 0.050810326957504946,
"eval_runtime": 117.7279,
"eval_samples_per_second": 6.906,
"eval_steps_per_second": 3.457,
"eval_wer": 0.06173300359292613,
"step": 11459
},
{
"epoch": 8.0,
"learning_rate": 6.666666666666667e-05,
"loss": 0.056,
"step": 13096
},
{
"epoch": 8.0,
"eval_loss": 0.3569846451282501,
"eval_per": 0.046711580137567134,
"eval_runtime": 118.1175,
"eval_samples_per_second": 6.883,
"eval_steps_per_second": 3.446,
"eval_wer": 0.058700013998413514,
"step": 13096
},
{
"epoch": 9.0,
"learning_rate": 6.111111111111112e-05,
"loss": 0.0478,
"step": 14733
},
{
"epoch": 9.0,
"eval_loss": 0.34502002596855164,
"eval_per": 0.04727692452652407,
"eval_runtime": 117.9103,
"eval_samples_per_second": 6.895,
"eval_steps_per_second": 3.452,
"eval_wer": 0.05832672297139657,
"step": 14733
},
{
"epoch": 10.0,
"learning_rate": 5.555555555555556e-05,
"loss": 0.0388,
"step": 16370
},
{
"epoch": 10.0,
"eval_loss": 0.3993436396121979,
"eval_per": 0.04803071704513333,
"eval_runtime": 117.7116,
"eval_samples_per_second": 6.907,
"eval_steps_per_second": 3.458,
"eval_wer": 0.05907330502543045,
"step": 16370
},
{
"epoch": 11.0,
"learning_rate": 5e-05,
"loss": 0.0378,
"step": 18007
},
{
"epoch": 11.0,
"eval_loss": 0.4171537160873413,
"eval_per": 0.0437435220955432,
"eval_runtime": 118.1365,
"eval_samples_per_second": 6.882,
"eval_steps_per_second": 3.445,
"eval_wer": 0.05501376510662125,
"step": 18007
},
{
"epoch": 12.0,
"learning_rate": 4.4444444444444447e-05,
"loss": 0.0319,
"step": 19644
},
{
"epoch": 12.0,
"eval_loss": 0.3625492751598358,
"eval_per": 0.04131725242626967,
"eval_runtime": 118.0928,
"eval_samples_per_second": 6.884,
"eval_steps_per_second": 3.446,
"eval_wer": 0.051794129998600155,
"step": 19644
},
{
"epoch": 13.0,
"learning_rate": 3.888888888888889e-05,
"loss": 0.0309,
"step": 21281
},
{
"epoch": 13.0,
"eval_loss": 0.3794006109237671,
"eval_per": 0.03919721096768115,
"eval_runtime": 118.3172,
"eval_samples_per_second": 6.871,
"eval_steps_per_second": 3.44,
"eval_wer": 0.05053427278241799,
"step": 21281
},
{
"epoch": 14.0,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.0257,
"step": 22918
},
{
"epoch": 14.0,
"eval_loss": 0.3896752893924713,
"eval_per": 0.04263638933383586,
"eval_runtime": 118.7663,
"eval_samples_per_second": 6.845,
"eval_steps_per_second": 3.427,
"eval_wer": 0.05342727824179926,
"step": 22918
},
{
"epoch": 15.0,
"learning_rate": 2.777777777777778e-05,
"loss": 0.0202,
"step": 24555
},
{
"epoch": 15.0,
"eval_loss": 0.40769127011299133,
"eval_per": 0.04042212381042118,
"eval_runtime": 118.2316,
"eval_samples_per_second": 6.876,
"eval_steps_per_second": 3.442,
"eval_wer": 0.05123419345807475,
"step": 24555
},
{
"epoch": 16.0,
"learning_rate": 2.2222222222222223e-05,
"loss": 0.0197,
"step": 26192
},
{
"epoch": 16.0,
"eval_loss": 0.38464316725730896,
"eval_per": 0.041128804296617354,
"eval_runtime": 118.9714,
"eval_samples_per_second": 6.834,
"eval_steps_per_second": 3.421,
"eval_wer": 0.05076757967430358,
"step": 26192
},
{
"epoch": 17.0,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.016,
"step": 27829
},
{
"epoch": 17.0,
"eval_loss": 0.3807629942893982,
"eval_per": 0.03910298690285499,
"eval_runtime": 118.4593,
"eval_samples_per_second": 6.863,
"eval_steps_per_second": 3.436,
"eval_wer": 0.04913443143110448,
"step": 27829
},
{
"epoch": 18.0,
"learning_rate": 1.1111111111111112e-05,
"loss": 0.0157,
"step": 29466
},
{
"epoch": 18.0,
"eval_loss": 0.4060150980949402,
"eval_per": 0.03726561763874493,
"eval_runtime": 118.2175,
"eval_samples_per_second": 6.877,
"eval_steps_per_second": 3.443,
"eval_wer": 0.047127992160888435,
"step": 29466
},
{
"epoch": 19.0,
"learning_rate": 5.555555555555556e-06,
"loss": 0.0131,
"step": 31103
},
{
"epoch": 19.0,
"eval_loss": 0.3925394117832184,
"eval_per": 0.03611137284462452,
"eval_runtime": 118.443,
"eval_samples_per_second": 6.864,
"eval_steps_per_second": 3.436,
"eval_wer": 0.04652139424198591,
"step": 31103
},
{
"epoch": 20.0,
"learning_rate": 0.0,
"loss": 0.0115,
"step": 32740
},
{
"epoch": 20.0,
"eval_loss": 0.39911746978759766,
"eval_per": 0.036252708941863755,
"eval_runtime": 118.88,
"eval_samples_per_second": 6.839,
"eval_steps_per_second": 3.424,
"eval_wer": 0.04656805562036303,
"step": 32740
},
{
"epoch": 20.0,
"step": 32740,
"total_flos": 1.0473975577487264e+19,
"train_loss": 0.3427419745201153,
"train_runtime": 19585.0411,
"train_samples_per_second": 3.342,
"train_steps_per_second": 1.672
}
],
"logging_steps": 500,
"max_steps": 32740,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 1.0473975577487264e+19,
"trial_name": null,
"trial_params": null
}