XLSR_Paiwan / trainer_state.json
eleferrand's picture
Upload 10 files
76a7548 verified
{
"best_metric": 0.15105250983113577,
"best_model_checkpoint": "xlsr_Paiwan/checkpoint-19740",
"epoch": 30.0,
"global_step": 19740,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.76,
"learning_rate": 0.0002924620060790273,
"loss": 2.0437,
"step": 500
},
{
"epoch": 1.0,
"eval_loss": 0.43691062927246094,
"eval_runtime": 54.5716,
"eval_samples_per_second": 54.79,
"eval_steps_per_second": 6.853,
"eval_wer": 0.57050328806054,
"step": 658
},
{
"epoch": 1.52,
"learning_rate": 0.00028486322188449846,
"loss": 0.4605,
"step": 1000
},
{
"epoch": 2.0,
"eval_loss": 0.3218730688095093,
"eval_runtime": 53.5979,
"eval_samples_per_second": 55.786,
"eval_steps_per_second": 6.978,
"eval_wer": 0.424407653415287,
"step": 1316
},
{
"epoch": 2.28,
"learning_rate": 0.0002772644376899696,
"loss": 0.3486,
"step": 1500
},
{
"epoch": 3.0,
"eval_loss": 0.2743721604347229,
"eval_runtime": 52.9623,
"eval_samples_per_second": 56.455,
"eval_steps_per_second": 7.062,
"eval_wer": 0.3111265325005783,
"step": 1974
},
{
"epoch": 3.04,
"learning_rate": 0.0002696656534954407,
"loss": 0.3005,
"step": 2000
},
{
"epoch": 3.8,
"learning_rate": 0.00026206686930091183,
"loss": 0.243,
"step": 2500
},
{
"epoch": 4.0,
"eval_loss": 0.2703934609889984,
"eval_runtime": 52.6582,
"eval_samples_per_second": 56.781,
"eval_steps_per_second": 7.102,
"eval_wer": 0.3132745117477942,
"step": 2632
},
{
"epoch": 4.56,
"learning_rate": 0.000254468085106383,
"loss": 0.2074,
"step": 3000
},
{
"epoch": 5.0,
"eval_loss": 0.2540125250816345,
"eval_runtime": 51.8815,
"eval_samples_per_second": 57.631,
"eval_steps_per_second": 7.209,
"eval_wer": 0.29308350682396483,
"step": 3290
},
{
"epoch": 5.32,
"learning_rate": 0.0002468693009118541,
"loss": 0.1827,
"step": 3500
},
{
"epoch": 6.0,
"eval_loss": 0.24963043630123138,
"eval_runtime": 52.0611,
"eval_samples_per_second": 57.433,
"eval_steps_per_second": 7.184,
"eval_wer": 0.24047453818446185,
"step": 3948
},
{
"epoch": 6.08,
"learning_rate": 0.0002392705167173252,
"loss": 0.1649,
"step": 4000
},
{
"epoch": 6.84,
"learning_rate": 0.00023167173252279633,
"loss": 0.1371,
"step": 4500
},
{
"epoch": 7.0,
"eval_loss": 0.24666966497898102,
"eval_runtime": 52.0071,
"eval_samples_per_second": 57.492,
"eval_steps_per_second": 7.191,
"eval_wer": 0.23730213806549685,
"step": 4606
},
{
"epoch": 7.6,
"learning_rate": 0.00022407294832826744,
"loss": 0.1258,
"step": 5000
},
{
"epoch": 8.0,
"eval_loss": 0.25583532452583313,
"eval_runtime": 52.0669,
"eval_samples_per_second": 57.426,
"eval_steps_per_second": 7.183,
"eval_wer": 0.22309242919929942,
"step": 5264
},
{
"epoch": 8.36,
"learning_rate": 0.00021647416413373858,
"loss": 0.1078,
"step": 5500
},
{
"epoch": 9.0,
"eval_loss": 0.2600269019603729,
"eval_runtime": 52.0714,
"eval_samples_per_second": 57.421,
"eval_steps_per_second": 7.182,
"eval_wer": 0.213310862165824,
"step": 5922
},
{
"epoch": 9.12,
"learning_rate": 0.00020887537993920973,
"loss": 0.1038,
"step": 6000
},
{
"epoch": 9.88,
"learning_rate": 0.00020127659574468082,
"loss": 0.0906,
"step": 6500
},
{
"epoch": 10.0,
"eval_loss": 0.25083455443382263,
"eval_runtime": 52.0294,
"eval_samples_per_second": 57.467,
"eval_steps_per_second": 7.188,
"eval_wer": 0.20997323287399625,
"step": 6580
},
{
"epoch": 10.64,
"learning_rate": 0.00019367781155015196,
"loss": 0.0843,
"step": 7000
},
{
"epoch": 11.0,
"eval_loss": 0.2840941548347473,
"eval_runtime": 52.1825,
"eval_samples_per_second": 57.299,
"eval_steps_per_second": 7.167,
"eval_wer": 0.19976206999107762,
"step": 7238
},
{
"epoch": 11.4,
"learning_rate": 0.0001860790273556231,
"loss": 0.0765,
"step": 7500
},
{
"epoch": 12.0,
"eval_loss": 0.26433253288269043,
"eval_runtime": 52.2172,
"eval_samples_per_second": 57.261,
"eval_steps_per_second": 7.162,
"eval_wer": 0.19328508641485742,
"step": 7896
},
{
"epoch": 12.16,
"learning_rate": 0.00017848024316109422,
"loss": 0.0699,
"step": 8000
},
{
"epoch": 12.92,
"learning_rate": 0.00017088145896656533,
"loss": 0.0671,
"step": 8500
},
{
"epoch": 13.0,
"eval_loss": 0.2808719873428345,
"eval_runtime": 52.2538,
"eval_samples_per_second": 57.221,
"eval_steps_per_second": 7.157,
"eval_wer": 0.18816298205611182,
"step": 8554
},
{
"epoch": 13.68,
"learning_rate": 0.00016329787234042553,
"loss": 0.0589,
"step": 9000
},
{
"epoch": 14.0,
"eval_loss": 0.2795076072216034,
"eval_runtime": 52.106,
"eval_samples_per_second": 57.383,
"eval_steps_per_second": 7.178,
"eval_wer": 0.18647764449291168,
"step": 9212
},
{
"epoch": 14.44,
"learning_rate": 0.00015569908814589664,
"loss": 0.0566,
"step": 9500
},
{
"epoch": 15.0,
"eval_loss": 0.27890855073928833,
"eval_runtime": 52.1531,
"eval_samples_per_second": 57.331,
"eval_steps_per_second": 7.171,
"eval_wer": 0.18158686097617396,
"step": 9870
},
{
"epoch": 15.2,
"learning_rate": 0.00014810030395136776,
"loss": 0.0514,
"step": 10000
},
{
"epoch": 15.96,
"learning_rate": 0.0001405015197568389,
"loss": 0.0507,
"step": 10500
},
{
"epoch": 16.0,
"eval_loss": 0.28275853395462036,
"eval_runtime": 52.1154,
"eval_samples_per_second": 57.373,
"eval_steps_per_second": 7.176,
"eval_wer": 0.17676216912858134,
"step": 10528
},
{
"epoch": 16.72,
"learning_rate": 0.00013291793313069907,
"loss": 0.0452,
"step": 11000
},
{
"epoch": 17.0,
"eval_loss": 0.2956693470478058,
"eval_runtime": 56.2891,
"eval_samples_per_second": 53.119,
"eval_steps_per_second": 6.644,
"eval_wer": 0.1839661610653977,
"step": 11186
},
{
"epoch": 17.48,
"learning_rate": 0.0001253191489361702,
"loss": 0.0414,
"step": 11500
},
{
"epoch": 18.0,
"eval_loss": 0.272775262594223,
"eval_runtime": 52.2587,
"eval_samples_per_second": 57.215,
"eval_steps_per_second": 7.157,
"eval_wer": 0.17431677737021248,
"step": 11844
},
{
"epoch": 18.24,
"learning_rate": 0.00011772036474164133,
"loss": 0.0373,
"step": 12000
},
{
"epoch": 19.0,
"learning_rate": 0.00011012158054711246,
"loss": 0.0362,
"step": 12500
},
{
"epoch": 19.0,
"eval_loss": 0.2982702851295471,
"eval_runtime": 52.2158,
"eval_samples_per_second": 57.262,
"eval_steps_per_second": 7.163,
"eval_wer": 0.17220184395756916,
"step": 12502
},
{
"epoch": 19.76,
"learning_rate": 0.00010252279635258359,
"loss": 0.0348,
"step": 13000
},
{
"epoch": 20.0,
"eval_loss": 0.2988567054271698,
"eval_runtime": 52.245,
"eval_samples_per_second": 57.23,
"eval_steps_per_second": 7.159,
"eval_wer": 0.1638082019761409,
"step": 13160
},
{
"epoch": 20.52,
"learning_rate": 9.493920972644377e-05,
"loss": 0.0324,
"step": 13500
},
{
"epoch": 21.0,
"eval_loss": 0.3093124032020569,
"eval_runtime": 52.8274,
"eval_samples_per_second": 56.599,
"eval_steps_per_second": 7.08,
"eval_wer": 0.16509698952447044,
"step": 13818
},
{
"epoch": 21.28,
"learning_rate": 8.734042553191488e-05,
"loss": 0.0303,
"step": 14000
},
{
"epoch": 22.0,
"eval_loss": 0.3057407736778259,
"eval_runtime": 52.5941,
"eval_samples_per_second": 56.851,
"eval_steps_per_second": 7.111,
"eval_wer": 0.16489871451703514,
"step": 14476
},
{
"epoch": 22.04,
"learning_rate": 7.974164133738601e-05,
"loss": 0.0293,
"step": 14500
},
{
"epoch": 22.8,
"learning_rate": 7.214285714285714e-05,
"loss": 0.0267,
"step": 15000
},
{
"epoch": 23.0,
"eval_loss": 0.3179123103618622,
"eval_runtime": 52.2627,
"eval_samples_per_second": 57.211,
"eval_steps_per_second": 7.156,
"eval_wer": 0.1582895476025247,
"step": 15134
},
{
"epoch": 23.56,
"learning_rate": 6.455927051671732e-05,
"loss": 0.026,
"step": 15500
},
{
"epoch": 24.0,
"eval_loss": 0.3296581506729126,
"eval_runtime": 52.0664,
"eval_samples_per_second": 57.427,
"eval_steps_per_second": 7.183,
"eval_wer": 0.15799213509137172,
"step": 15792
},
{
"epoch": 24.32,
"learning_rate": 5.696048632218844e-05,
"loss": 0.0246,
"step": 16000
},
{
"epoch": 25.0,
"eval_loss": 0.3182116746902466,
"eval_runtime": 51.9316,
"eval_samples_per_second": 57.576,
"eval_steps_per_second": 7.202,
"eval_wer": 0.15541455999471265,
"step": 16450
},
{
"epoch": 25.08,
"learning_rate": 4.937689969604863e-05,
"loss": 0.0235,
"step": 16500
},
{
"epoch": 25.84,
"learning_rate": 4.179331306990881e-05,
"loss": 0.0215,
"step": 17000
},
{
"epoch": 26.0,
"eval_loss": 0.3294830620288849,
"eval_runtime": 52.2884,
"eval_samples_per_second": 57.183,
"eval_steps_per_second": 7.153,
"eval_wer": 0.15541455999471265,
"step": 17108
},
{
"epoch": 26.6,
"learning_rate": 3.419452887537994e-05,
"loss": 0.0199,
"step": 17500
},
{
"epoch": 27.0,
"eval_loss": 0.33707642555236816,
"eval_runtime": 51.7426,
"eval_samples_per_second": 57.786,
"eval_steps_per_second": 7.228,
"eval_wer": 0.1535309474240772,
"step": 17766
},
{
"epoch": 27.36,
"learning_rate": 2.6595744680851064e-05,
"loss": 0.019,
"step": 18000
},
{
"epoch": 28.0,
"eval_loss": 0.34009498357772827,
"eval_runtime": 51.768,
"eval_samples_per_second": 57.758,
"eval_steps_per_second": 7.225,
"eval_wer": 0.15174647235715938,
"step": 18424
},
{
"epoch": 28.12,
"learning_rate": 1.8996960486322186e-05,
"loss": 0.0185,
"step": 18500
},
{
"epoch": 28.88,
"learning_rate": 1.139817629179331e-05,
"loss": 0.0172,
"step": 19000
},
{
"epoch": 29.0,
"eval_loss": 0.34455737471580505,
"eval_runtime": 51.8182,
"eval_samples_per_second": 57.702,
"eval_steps_per_second": 7.218,
"eval_wer": 0.15108555566570833,
"step": 19082
},
{
"epoch": 29.64,
"learning_rate": 3.7993920972644374e-06,
"loss": 0.0166,
"step": 19500
},
{
"epoch": 30.0,
"eval_loss": 0.3466561436653137,
"eval_runtime": 51.8971,
"eval_samples_per_second": 57.614,
"eval_steps_per_second": 7.207,
"eval_wer": 0.15105250983113577,
"step": 19740
}
],
"max_steps": 19740,
"num_train_epochs": 30,
"total_flos": 7.422835365656386e+19,
"trial_name": null,
"trial_params": null
}