wav2vec2-xls-r-1b-japanese / trainer_state.json
vumichien's picture
End of training
cd1f931
raw
history blame
12.4 kB
{
"best_metric": 0.21041299402713776,
"best_model_checkpoint": "wav2vec2-xls-r-1b-ja-dumy8/checkpoint-42000",
"epoch": 99.99831744251262,
"global_step": 44500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.37,
"learning_rate": 4.9427586206896555e-05,
"loss": 2.2896,
"step": 1500
},
{
"epoch": 3.37,
"eval_cer": 0.17672193185166804,
"eval_loss": 0.47477588057518005,
"eval_runtime": 210.4906,
"eval_samples_per_second": 17.464,
"eval_steps_per_second": 2.185,
"eval_wer": 0.4013274336283186,
"step": 1500
},
{
"epoch": 6.74,
"learning_rate": 4.770459770114943e-05,
"loss": 1.1608,
"step": 3000
},
{
"epoch": 6.74,
"eval_cer": 0.14555577958031546,
"eval_loss": 0.33504194021224976,
"eval_runtime": 209.7295,
"eval_samples_per_second": 17.527,
"eval_steps_per_second": 2.193,
"eval_wer": 0.315929203539823,
"step": 3000
},
{
"epoch": 10.11,
"learning_rate": 4.598045977011494e-05,
"loss": 1.1042,
"step": 4500
},
{
"epoch": 10.11,
"eval_cer": 0.1399956573661926,
"eval_loss": 0.31194448471069336,
"eval_runtime": 210.0423,
"eval_samples_per_second": 17.501,
"eval_steps_per_second": 2.19,
"eval_wer": 0.2970656730321379,
"step": 4500
},
{
"epoch": 13.48,
"learning_rate": 4.4257471264367814e-05,
"loss": 1.0494,
"step": 6000
},
{
"epoch": 13.48,
"eval_cer": 0.1353350807264606,
"eval_loss": 0.2974083721637726,
"eval_runtime": 209.3107,
"eval_samples_per_second": 17.562,
"eval_steps_per_second": 2.198,
"eval_wer": 0.2867489520260829,
"step": 6000
},
{
"epoch": 16.85,
"learning_rate": 4.253448275862069e-05,
"loss": 1.0061,
"step": 7500
},
{
"epoch": 16.85,
"eval_cer": 0.1299610713897979,
"eval_loss": 0.2802002429962158,
"eval_runtime": 210.2437,
"eval_samples_per_second": 17.484,
"eval_steps_per_second": 2.188,
"eval_wer": 0.2745924545877969,
"step": 7500
},
{
"epoch": 20.22,
"learning_rate": 4.0810344827586214e-05,
"loss": 0.9629,
"step": 9000
},
{
"epoch": 20.22,
"eval_cer": 0.13255889697101292,
"eval_loss": 0.2843669652938843,
"eval_runtime": 212.4442,
"eval_samples_per_second": 17.303,
"eval_steps_per_second": 2.165,
"eval_wer": 0.2776432231020028,
"step": 9000
},
{
"epoch": 23.59,
"learning_rate": 3.908735632183908e-05,
"loss": 0.9267,
"step": 10500
},
{
"epoch": 23.59,
"eval_cer": 0.12550211703398112,
"eval_loss": 0.2576734721660614,
"eval_runtime": 210.3131,
"eval_samples_per_second": 17.479,
"eval_steps_per_second": 2.187,
"eval_wer": 0.2603400093153237,
"step": 10500
},
{
"epoch": 26.96,
"learning_rate": 3.73632183908046e-05,
"loss": 0.8984,
"step": 12000
},
{
"epoch": 26.96,
"eval_cer": 0.12256308451075577,
"eval_loss": 0.2508338689804077,
"eval_runtime": 209.2521,
"eval_samples_per_second": 17.567,
"eval_steps_per_second": 2.198,
"eval_wer": 0.2530740568234746,
"step": 12000
},
{
"epoch": 30.34,
"learning_rate": 3.564022988505747e-05,
"loss": 0.8729,
"step": 13500
},
{
"epoch": 30.34,
"eval_cer": 0.12540906059525103,
"eval_loss": 0.26286962628364563,
"eval_runtime": 208.7235,
"eval_samples_per_second": 17.612,
"eval_steps_per_second": 2.204,
"eval_wer": 0.2605728924080112,
"step": 13500
},
{
"epoch": 33.71,
"learning_rate": 3.3917241379310346e-05,
"loss": 0.8546,
"step": 15000
},
{
"epoch": 33.71,
"eval_cer": 0.11932161856165764,
"eval_loss": 0.2401771992444992,
"eval_runtime": 208.4946,
"eval_samples_per_second": 17.631,
"eval_steps_per_second": 2.206,
"eval_wer": 0.24473684210526317,
"step": 15000
},
{
"epoch": 37.08,
"learning_rate": 3.219310344827586e-05,
"loss": 0.8304,
"step": 16500
},
{
"epoch": 37.08,
"eval_cer": 0.12086480450393164,
"eval_loss": 0.25319021940231323,
"eval_runtime": 209.1002,
"eval_samples_per_second": 17.58,
"eval_steps_per_second": 2.2,
"eval_wer": 0.2472286911970191,
"step": 16500
},
{
"epoch": 40.45,
"learning_rate": 3.046896551724138e-05,
"loss": 0.8075,
"step": 18000
},
{
"epoch": 40.45,
"eval_cer": 0.11977139134885308,
"eval_loss": 0.2439287155866623,
"eval_runtime": 209.0991,
"eval_samples_per_second": 17.58,
"eval_steps_per_second": 2.2,
"eval_wer": 0.2468793665579879,
"step": 18000
},
{
"epoch": 43.82,
"learning_rate": 2.8747126436781612e-05,
"loss": 0.7827,
"step": 19500
},
{
"epoch": 43.82,
"eval_cer": 0.11672379298044264,
"eval_loss": 0.23866486549377441,
"eval_runtime": 208.9618,
"eval_samples_per_second": 17.592,
"eval_steps_per_second": 2.201,
"eval_wer": 0.23721471821145784,
"step": 19500
},
{
"epoch": 47.19,
"learning_rate": 2.7022988505747126e-05,
"loss": 0.7627,
"step": 21000
},
{
"epoch": 47.19,
"eval_cer": 0.11469981543806318,
"eval_loss": 0.23443765938282013,
"eval_runtime": 209.1358,
"eval_samples_per_second": 17.577,
"eval_steps_per_second": 2.2,
"eval_wer": 0.23306939916162087,
"step": 21000
},
{
"epoch": 50.56,
"learning_rate": 2.5300000000000002e-05,
"loss": 0.7402,
"step": 22500
},
{
"epoch": 50.56,
"eval_cer": 0.11345906292166198,
"eval_loss": 0.23135580122470856,
"eval_runtime": 210.5917,
"eval_samples_per_second": 17.456,
"eval_steps_per_second": 2.184,
"eval_wer": 0.22994876571960876,
"step": 22500
},
{
"epoch": 53.93,
"learning_rate": 2.357586206896552e-05,
"loss": 0.718,
"step": 24000
},
{
"epoch": 53.93,
"eval_cer": 0.1114040665663725,
"eval_loss": 0.22568760812282562,
"eval_runtime": 208.402,
"eval_samples_per_second": 17.639,
"eval_steps_per_second": 2.207,
"eval_wer": 0.22666511411271542,
"step": 24000
},
{
"epoch": 57.3,
"learning_rate": 2.1851724137931033e-05,
"loss": 0.7016,
"step": 25500
},
{
"epoch": 57.3,
"eval_cer": 0.10889929742388758,
"eval_loss": 0.22044427692890167,
"eval_runtime": 208.5673,
"eval_samples_per_second": 17.625,
"eval_steps_per_second": 2.206,
"eval_wer": 0.2183977643223102,
"step": 25500
},
{
"epoch": 60.67,
"learning_rate": 2.012873563218391e-05,
"loss": 0.6804,
"step": 27000
},
{
"epoch": 60.67,
"eval_cer": 0.10851931696573971,
"eval_loss": 0.22273367643356323,
"eval_runtime": 208.2294,
"eval_samples_per_second": 17.654,
"eval_steps_per_second": 2.209,
"eval_wer": 0.21811830461108522,
"step": 27000
},
{
"epoch": 64.04,
"learning_rate": 1.8405747126436782e-05,
"loss": 0.6625,
"step": 28500
},
{
"epoch": 64.04,
"eval_cer": 0.10578966142965708,
"eval_loss": 0.21378228068351746,
"eval_runtime": 209.3597,
"eval_samples_per_second": 17.558,
"eval_steps_per_second": 2.197,
"eval_wer": 0.21115510013972985,
"step": 28500
},
{
"epoch": 67.42,
"learning_rate": 1.66816091954023e-05,
"loss": 0.6465,
"step": 30000
},
{
"epoch": 67.42,
"eval_cer": 0.10442483366161577,
"eval_loss": 0.2140830010175705,
"eval_runtime": 208.6345,
"eval_samples_per_second": 17.619,
"eval_steps_per_second": 2.205,
"eval_wer": 0.20808104331625524,
"step": 30000
},
{
"epoch": 70.79,
"learning_rate": 1.4958620689655173e-05,
"loss": 0.6238,
"step": 31500
},
{
"epoch": 70.79,
"eval_cer": 0.1049754175907688,
"eval_loss": 0.21720194816589355,
"eval_runtime": 210.4781,
"eval_samples_per_second": 17.465,
"eval_steps_per_second": 2.186,
"eval_wer": 0.2082207731718677,
"step": 31500
},
{
"epoch": 74.16,
"learning_rate": 1.323448275862069e-05,
"loss": 0.6062,
"step": 33000
},
{
"epoch": 74.16,
"eval_cer": 0.10427749430029312,
"eval_loss": 0.2174130082130432,
"eval_runtime": 209.3158,
"eval_samples_per_second": 17.562,
"eval_steps_per_second": 2.198,
"eval_wer": 0.20582207731718677,
"step": 33000
},
{
"epoch": 77.53,
"learning_rate": 1.1510344827586207e-05,
"loss": 0.588,
"step": 34500
},
{
"epoch": 77.53,
"eval_cer": 0.1026955348418816,
"eval_loss": 0.21560049057006836,
"eval_runtime": 208.8439,
"eval_samples_per_second": 17.602,
"eval_steps_per_second": 2.203,
"eval_wer": 0.20344666977177456,
"step": 34500
},
{
"epoch": 80.9,
"learning_rate": 9.786206896551724e-06,
"loss": 0.5722,
"step": 36000
},
{
"epoch": 80.9,
"eval_cer": 0.10293593064193433,
"eval_loss": 0.21624404191970825,
"eval_runtime": 208.6816,
"eval_samples_per_second": 17.615,
"eval_steps_per_second": 2.204,
"eval_wer": 0.2032137866790871,
"step": 36000
},
{
"epoch": 84.27,
"learning_rate": 8.064367816091953e-06,
"loss": 0.5585,
"step": 37500
},
{
"epoch": 84.27,
"eval_cer": 0.10209066799013601,
"eval_loss": 0.21560421586036682,
"eval_runtime": 211.1243,
"eval_samples_per_second": 17.412,
"eval_steps_per_second": 2.179,
"eval_wer": 0.20216581276199347,
"step": 37500
},
{
"epoch": 87.64,
"learning_rate": 6.341379310344828e-06,
"loss": 0.5456,
"step": 39000
},
{
"epoch": 87.64,
"eval_cer": 0.10090419839632737,
"eval_loss": 0.21256230771541595,
"eval_runtime": 208.9966,
"eval_samples_per_second": 17.589,
"eval_steps_per_second": 2.201,
"eval_wer": 0.19930135072193758,
"step": 39000
},
{
"epoch": 91.01,
"learning_rate": 4.618390804597701e-06,
"loss": 0.5325,
"step": 40500
},
{
"epoch": 91.01,
"eval_cer": 0.10033810506071933,
"eval_loss": 0.2121460884809494,
"eval_runtime": 208.4119,
"eval_samples_per_second": 17.638,
"eval_steps_per_second": 2.207,
"eval_wer": 0.19659990684676293,
"step": 40500
},
{
"epoch": 94.38,
"learning_rate": 2.8942528735632185e-06,
"loss": 0.5229,
"step": 42000
},
{
"epoch": 94.38,
"eval_cer": 0.09914388076368318,
"eval_loss": 0.21041299402713776,
"eval_runtime": 208.604,
"eval_samples_per_second": 17.622,
"eval_steps_per_second": 2.205,
"eval_wer": 0.19410805775500697,
"step": 42000
},
{
"epoch": 97.75,
"learning_rate": 1.1701149425287358e-06,
"loss": 0.5134,
"step": 43500
},
{
"epoch": 97.75,
"eval_cer": 0.0991593901701382,
"eval_loss": 0.21077032387256622,
"eval_runtime": 208.8814,
"eval_samples_per_second": 17.599,
"eval_steps_per_second": 2.202,
"eval_wer": 0.19482999534233814,
"step": 43500
},
{
"epoch": 100.0,
"step": 44500,
"total_flos": 1.4850172866055105e+21,
"train_loss": 0.804292679347349,
"train_runtime": 300809.9995,
"train_samples_per_second": 9.48,
"train_steps_per_second": 0.148
}
],
"max_steps": 44500,
"num_train_epochs": 100,
"total_flos": 1.4850172866055105e+21,
"trial_name": null,
"trial_params": null
}