Whisper-Small-Kinyarwanda / trainer_state.json
Kleber's picture
Upload . with huggingface_hub
b227e33
{
"best_metric": 24.71689240755159,
"best_model_checkpoint": "output_dir_run_2/checkpoint-42000",
"epoch": 1.834423353006859,
"global_step": 46000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 4.4e-07,
"loss": 3.8256,
"step": 25
},
{
"epoch": 0.0,
"learning_rate": 9.200000000000001e-07,
"loss": 3.5128,
"step": 50
},
{
"epoch": 0.0,
"learning_rate": 1.42e-06,
"loss": 2.8953,
"step": 75
},
{
"epoch": 0.0,
"learning_rate": 1.9200000000000003e-06,
"loss": 2.3779,
"step": 100
},
{
"epoch": 0.0,
"learning_rate": 2.42e-06,
"loss": 2.065,
"step": 125
},
{
"epoch": 0.01,
"learning_rate": 2.92e-06,
"loss": 1.8663,
"step": 150
},
{
"epoch": 0.01,
"learning_rate": 3.4200000000000007e-06,
"loss": 1.6813,
"step": 175
},
{
"epoch": 0.01,
"learning_rate": 3.920000000000001e-06,
"loss": 1.6136,
"step": 200
},
{
"epoch": 0.01,
"learning_rate": 4.42e-06,
"loss": 1.5066,
"step": 225
},
{
"epoch": 0.01,
"learning_rate": 4.92e-06,
"loss": 1.3971,
"step": 250
},
{
"epoch": 0.01,
"learning_rate": 5.420000000000001e-06,
"loss": 1.3437,
"step": 275
},
{
"epoch": 0.01,
"learning_rate": 5.92e-06,
"loss": 1.2227,
"step": 300
},
{
"epoch": 0.01,
"learning_rate": 6.42e-06,
"loss": 1.2204,
"step": 325
},
{
"epoch": 0.01,
"learning_rate": 6.92e-06,
"loss": 1.1546,
"step": 350
},
{
"epoch": 0.01,
"learning_rate": 7.420000000000001e-06,
"loss": 1.1521,
"step": 375
},
{
"epoch": 0.02,
"learning_rate": 7.92e-06,
"loss": 1.0848,
"step": 400
},
{
"epoch": 0.02,
"learning_rate": 8.42e-06,
"loss": 1.0626,
"step": 425
},
{
"epoch": 0.02,
"learning_rate": 8.920000000000001e-06,
"loss": 1.0112,
"step": 450
},
{
"epoch": 0.02,
"learning_rate": 9.42e-06,
"loss": 0.988,
"step": 475
},
{
"epoch": 0.02,
"learning_rate": 9.920000000000002e-06,
"loss": 0.9656,
"step": 500
},
{
"epoch": 0.02,
"learning_rate": 9.99957957957958e-06,
"loss": 0.9418,
"step": 525
},
{
"epoch": 0.02,
"learning_rate": 9.99907907907908e-06,
"loss": 0.9225,
"step": 550
},
{
"epoch": 0.02,
"learning_rate": 9.99857857857858e-06,
"loss": 0.9479,
"step": 575
},
{
"epoch": 0.02,
"learning_rate": 9.998078078078079e-06,
"loss": 0.8927,
"step": 600
},
{
"epoch": 0.02,
"learning_rate": 9.997577577577578e-06,
"loss": 0.8688,
"step": 625
},
{
"epoch": 0.03,
"learning_rate": 9.997077077077078e-06,
"loss": 0.8846,
"step": 650
},
{
"epoch": 0.03,
"learning_rate": 9.996576576576577e-06,
"loss": 0.8514,
"step": 675
},
{
"epoch": 0.03,
"learning_rate": 9.996076076076076e-06,
"loss": 0.8254,
"step": 700
},
{
"epoch": 0.03,
"learning_rate": 9.995575575575577e-06,
"loss": 0.8167,
"step": 725
},
{
"epoch": 0.03,
"learning_rate": 9.995075075075076e-06,
"loss": 0.7695,
"step": 750
},
{
"epoch": 0.03,
"learning_rate": 9.994574574574576e-06,
"loss": 0.8109,
"step": 775
},
{
"epoch": 0.03,
"learning_rate": 9.994074074074075e-06,
"loss": 0.7718,
"step": 800
},
{
"epoch": 0.03,
"learning_rate": 9.993573573573574e-06,
"loss": 0.7937,
"step": 825
},
{
"epoch": 0.03,
"learning_rate": 9.993073073073074e-06,
"loss": 0.7566,
"step": 850
},
{
"epoch": 0.03,
"learning_rate": 9.992572572572573e-06,
"loss": 0.7627,
"step": 875
},
{
"epoch": 0.04,
"learning_rate": 9.992072072072074e-06,
"loss": 0.7564,
"step": 900
},
{
"epoch": 0.04,
"learning_rate": 9.991571571571572e-06,
"loss": 0.766,
"step": 925
},
{
"epoch": 0.04,
"learning_rate": 9.991071071071073e-06,
"loss": 0.7255,
"step": 950
},
{
"epoch": 0.04,
"learning_rate": 9.990570570570572e-06,
"loss": 0.7385,
"step": 975
},
{
"epoch": 0.04,
"learning_rate": 9.990070070070071e-06,
"loss": 0.7455,
"step": 1000
},
{
"epoch": 0.04,
"eval_loss": 0.9031199216842651,
"eval_runtime": 2867.5101,
"eval_samples_per_second": 5.654,
"eval_steps_per_second": 0.142,
"eval_wer": 58.282005226601704,
"step": 1000
},
{
"epoch": 0.04,
"learning_rate": 9.98956956956957e-06,
"loss": 0.7141,
"step": 1025
},
{
"epoch": 0.04,
"learning_rate": 9.98906906906907e-06,
"loss": 0.7036,
"step": 1050
},
{
"epoch": 0.04,
"learning_rate": 9.988568568568569e-06,
"loss": 0.7157,
"step": 1075
},
{
"epoch": 0.04,
"learning_rate": 9.988068068068068e-06,
"loss": 0.7362,
"step": 1100
},
{
"epoch": 0.04,
"learning_rate": 9.98756756756757e-06,
"loss": 0.7134,
"step": 1125
},
{
"epoch": 0.05,
"learning_rate": 9.987067067067067e-06,
"loss": 0.6704,
"step": 1150
},
{
"epoch": 0.05,
"learning_rate": 9.986566566566568e-06,
"loss": 0.6907,
"step": 1175
},
{
"epoch": 0.05,
"learning_rate": 9.986066066066067e-06,
"loss": 0.6851,
"step": 1200
},
{
"epoch": 0.05,
"learning_rate": 9.985565565565567e-06,
"loss": 0.7214,
"step": 1225
},
{
"epoch": 0.05,
"learning_rate": 9.985065065065066e-06,
"loss": 0.6876,
"step": 1250
},
{
"epoch": 0.05,
"learning_rate": 9.984564564564565e-06,
"loss": 0.6627,
"step": 1275
},
{
"epoch": 0.05,
"learning_rate": 9.984064064064064e-06,
"loss": 0.6739,
"step": 1300
},
{
"epoch": 0.05,
"learning_rate": 9.983563563563564e-06,
"loss": 0.6629,
"step": 1325
},
{
"epoch": 0.05,
"learning_rate": 9.983063063063065e-06,
"loss": 0.6493,
"step": 1350
},
{
"epoch": 0.05,
"learning_rate": 9.982562562562564e-06,
"loss": 0.6512,
"step": 1375
},
{
"epoch": 0.06,
"learning_rate": 9.982062062062063e-06,
"loss": 0.6481,
"step": 1400
},
{
"epoch": 0.06,
"learning_rate": 9.981561561561563e-06,
"loss": 0.6459,
"step": 1425
},
{
"epoch": 0.06,
"learning_rate": 9.981061061061062e-06,
"loss": 0.643,
"step": 1450
},
{
"epoch": 0.06,
"learning_rate": 9.980560560560561e-06,
"loss": 0.6344,
"step": 1475
},
{
"epoch": 0.06,
"learning_rate": 9.98006006006006e-06,
"loss": 0.6312,
"step": 1500
},
{
"epoch": 0.06,
"learning_rate": 9.979559559559561e-06,
"loss": 0.6587,
"step": 1525
},
{
"epoch": 0.06,
"learning_rate": 9.979059059059059e-06,
"loss": 0.6156,
"step": 1550
},
{
"epoch": 0.06,
"learning_rate": 9.97855855855856e-06,
"loss": 0.64,
"step": 1575
},
{
"epoch": 0.06,
"learning_rate": 9.97805805805806e-06,
"loss": 0.5947,
"step": 1600
},
{
"epoch": 0.06,
"learning_rate": 9.977557557557559e-06,
"loss": 0.6496,
"step": 1625
},
{
"epoch": 0.07,
"learning_rate": 9.977057057057058e-06,
"loss": 0.6434,
"step": 1650
},
{
"epoch": 0.07,
"learning_rate": 9.976556556556557e-06,
"loss": 0.5917,
"step": 1675
},
{
"epoch": 0.07,
"learning_rate": 9.976056056056057e-06,
"loss": 0.6057,
"step": 1700
},
{
"epoch": 0.07,
"learning_rate": 9.975555555555556e-06,
"loss": 0.6132,
"step": 1725
},
{
"epoch": 0.07,
"learning_rate": 9.975055055055057e-06,
"loss": 0.5929,
"step": 1750
},
{
"epoch": 0.07,
"learning_rate": 9.974554554554554e-06,
"loss": 0.6166,
"step": 1775
},
{
"epoch": 0.07,
"learning_rate": 9.974054054054055e-06,
"loss": 0.5866,
"step": 1800
},
{
"epoch": 0.07,
"learning_rate": 9.973553553553555e-06,
"loss": 0.6123,
"step": 1825
},
{
"epoch": 0.07,
"learning_rate": 9.973053053053054e-06,
"loss": 0.594,
"step": 1850
},
{
"epoch": 0.07,
"learning_rate": 9.972552552552553e-06,
"loss": 0.5949,
"step": 1875
},
{
"epoch": 0.08,
"learning_rate": 9.972052052052053e-06,
"loss": 0.5862,
"step": 1900
},
{
"epoch": 0.08,
"learning_rate": 9.971551551551552e-06,
"loss": 0.609,
"step": 1925
},
{
"epoch": 0.08,
"learning_rate": 9.971051051051051e-06,
"loss": 0.5688,
"step": 1950
},
{
"epoch": 0.08,
"learning_rate": 9.970550550550552e-06,
"loss": 0.592,
"step": 1975
},
{
"epoch": 0.08,
"learning_rate": 9.970050050050052e-06,
"loss": 0.5906,
"step": 2000
},
{
"epoch": 0.08,
"eval_loss": 0.7455159425735474,
"eval_runtime": 3054.18,
"eval_samples_per_second": 5.308,
"eval_steps_per_second": 0.133,
"eval_wer": 50.6001341340261,
"step": 2000
},
{
"epoch": 0.08,
"learning_rate": 9.96954954954955e-06,
"loss": 0.5755,
"step": 2025
},
{
"epoch": 0.08,
"learning_rate": 9.96904904904905e-06,
"loss": 0.5761,
"step": 2050
},
{
"epoch": 0.08,
"learning_rate": 9.96854854854855e-06,
"loss": 0.5832,
"step": 2075
},
{
"epoch": 0.08,
"learning_rate": 9.968048048048049e-06,
"loss": 0.5661,
"step": 2100
},
{
"epoch": 0.08,
"learning_rate": 9.967547547547548e-06,
"loss": 0.5906,
"step": 2125
},
{
"epoch": 0.09,
"learning_rate": 9.967047047047049e-06,
"loss": 0.5769,
"step": 2150
},
{
"epoch": 0.09,
"learning_rate": 9.966546546546547e-06,
"loss": 0.5491,
"step": 2175
},
{
"epoch": 0.09,
"learning_rate": 9.966046046046048e-06,
"loss": 0.5794,
"step": 2200
},
{
"epoch": 0.09,
"learning_rate": 9.965545545545547e-06,
"loss": 0.5319,
"step": 2225
},
{
"epoch": 0.09,
"learning_rate": 9.965045045045044e-06,
"loss": 0.5656,
"step": 2250
},
{
"epoch": 0.09,
"learning_rate": 9.964544544544545e-06,
"loss": 0.5714,
"step": 2275
},
{
"epoch": 0.09,
"learning_rate": 9.964044044044045e-06,
"loss": 0.5667,
"step": 2300
},
{
"epoch": 0.09,
"learning_rate": 9.963543543543544e-06,
"loss": 0.5628,
"step": 2325
},
{
"epoch": 0.09,
"learning_rate": 9.963043043043043e-06,
"loss": 0.5816,
"step": 2350
},
{
"epoch": 0.09,
"learning_rate": 9.962542542542544e-06,
"loss": 0.5713,
"step": 2375
},
{
"epoch": 0.1,
"learning_rate": 9.962042042042042e-06,
"loss": 0.5513,
"step": 2400
},
{
"epoch": 0.1,
"learning_rate": 9.961541541541543e-06,
"loss": 0.5416,
"step": 2425
},
{
"epoch": 0.1,
"learning_rate": 9.961041041041042e-06,
"loss": 0.5273,
"step": 2450
},
{
"epoch": 0.1,
"learning_rate": 9.960540540540542e-06,
"loss": 0.5414,
"step": 2475
},
{
"epoch": 0.1,
"learning_rate": 9.960040040040041e-06,
"loss": 0.5454,
"step": 2500
},
{
"epoch": 0.1,
"learning_rate": 9.95953953953954e-06,
"loss": 0.5335,
"step": 2525
},
{
"epoch": 0.1,
"learning_rate": 9.95903903903904e-06,
"loss": 0.538,
"step": 2550
},
{
"epoch": 0.1,
"learning_rate": 9.958538538538539e-06,
"loss": 0.5275,
"step": 2575
},
{
"epoch": 0.1,
"learning_rate": 9.95803803803804e-06,
"loss": 0.541,
"step": 2600
},
{
"epoch": 0.1,
"learning_rate": 9.957537537537539e-06,
"loss": 0.5653,
"step": 2625
},
{
"epoch": 0.11,
"learning_rate": 9.957037037037038e-06,
"loss": 0.5407,
"step": 2650
},
{
"epoch": 0.11,
"learning_rate": 9.956536536536538e-06,
"loss": 0.5508,
"step": 2675
},
{
"epoch": 0.11,
"learning_rate": 9.956036036036037e-06,
"loss": 0.507,
"step": 2700
},
{
"epoch": 0.11,
"learning_rate": 9.955535535535536e-06,
"loss": 0.5289,
"step": 2725
},
{
"epoch": 0.11,
"learning_rate": 9.955035035035036e-06,
"loss": 0.543,
"step": 2750
},
{
"epoch": 0.11,
"learning_rate": 9.954534534534537e-06,
"loss": 0.5489,
"step": 2775
},
{
"epoch": 0.11,
"learning_rate": 9.954034034034034e-06,
"loss": 0.5433,
"step": 2800
},
{
"epoch": 0.11,
"learning_rate": 9.953533533533535e-06,
"loss": 0.5372,
"step": 2825
},
{
"epoch": 0.11,
"learning_rate": 9.953033033033034e-06,
"loss": 0.5397,
"step": 2850
},
{
"epoch": 0.11,
"learning_rate": 9.952532532532532e-06,
"loss": 0.5429,
"step": 2875
},
{
"epoch": 0.12,
"learning_rate": 9.952032032032033e-06,
"loss": 0.5178,
"step": 2900
},
{
"epoch": 0.12,
"learning_rate": 9.951531531531532e-06,
"loss": 0.5426,
"step": 2925
},
{
"epoch": 0.12,
"learning_rate": 9.951031031031032e-06,
"loss": 0.5301,
"step": 2950
},
{
"epoch": 0.12,
"learning_rate": 9.950530530530531e-06,
"loss": 0.5113,
"step": 2975
},
{
"epoch": 0.12,
"learning_rate": 9.950030030030032e-06,
"loss": 0.5015,
"step": 3000
},
{
"epoch": 0.12,
"eval_loss": 0.6700246334075928,
"eval_runtime": 2829.2547,
"eval_samples_per_second": 5.73,
"eval_steps_per_second": 0.144,
"eval_wer": 45.80060283223225,
"step": 3000
},
{
"epoch": 0.12,
"learning_rate": 9.94952952952953e-06,
"loss": 0.5075,
"step": 3025
},
{
"epoch": 0.12,
"learning_rate": 9.94902902902903e-06,
"loss": 0.548,
"step": 3050
},
{
"epoch": 0.12,
"learning_rate": 9.94852852852853e-06,
"loss": 0.5221,
"step": 3075
},
{
"epoch": 0.12,
"learning_rate": 9.948028028028029e-06,
"loss": 0.5108,
"step": 3100
},
{
"epoch": 0.12,
"learning_rate": 9.947527527527528e-06,
"loss": 0.4792,
"step": 3125
},
{
"epoch": 0.13,
"learning_rate": 9.947027027027028e-06,
"loss": 0.4993,
"step": 3150
},
{
"epoch": 0.13,
"learning_rate": 9.946526526526527e-06,
"loss": 0.5159,
"step": 3175
},
{
"epoch": 0.13,
"learning_rate": 9.946026026026026e-06,
"loss": 0.4948,
"step": 3200
},
{
"epoch": 0.13,
"learning_rate": 9.945525525525527e-06,
"loss": 0.527,
"step": 3225
},
{
"epoch": 0.13,
"learning_rate": 9.945025025025027e-06,
"loss": 0.4831,
"step": 3250
},
{
"epoch": 0.13,
"learning_rate": 9.944524524524526e-06,
"loss": 0.5106,
"step": 3275
},
{
"epoch": 0.13,
"learning_rate": 9.944024024024025e-06,
"loss": 0.5323,
"step": 3300
},
{
"epoch": 0.13,
"learning_rate": 9.943523523523524e-06,
"loss": 0.502,
"step": 3325
},
{
"epoch": 0.13,
"learning_rate": 9.943023023023024e-06,
"loss": 0.495,
"step": 3350
},
{
"epoch": 0.13,
"learning_rate": 9.942522522522523e-06,
"loss": 0.519,
"step": 3375
},
{
"epoch": 0.14,
"learning_rate": 9.942022022022022e-06,
"loss": 0.5351,
"step": 3400
},
{
"epoch": 0.14,
"learning_rate": 9.941521521521522e-06,
"loss": 0.4833,
"step": 3425
},
{
"epoch": 0.14,
"learning_rate": 9.941021021021023e-06,
"loss": 0.5227,
"step": 3450
},
{
"epoch": 0.14,
"learning_rate": 9.940520520520522e-06,
"loss": 0.4969,
"step": 3475
},
{
"epoch": 0.14,
"learning_rate": 9.94002002002002e-06,
"loss": 0.5103,
"step": 3500
},
{
"epoch": 0.14,
"learning_rate": 9.93951951951952e-06,
"loss": 0.5109,
"step": 3525
},
{
"epoch": 0.14,
"learning_rate": 9.93901901901902e-06,
"loss": 0.5228,
"step": 3550
},
{
"epoch": 0.14,
"learning_rate": 9.938518518518519e-06,
"loss": 0.4983,
"step": 3575
},
{
"epoch": 0.14,
"learning_rate": 9.938018018018018e-06,
"loss": 0.4873,
"step": 3600
},
{
"epoch": 0.14,
"learning_rate": 9.93751751751752e-06,
"loss": 0.4955,
"step": 3625
},
{
"epoch": 0.15,
"learning_rate": 9.937017017017017e-06,
"loss": 0.5064,
"step": 3650
},
{
"epoch": 0.15,
"learning_rate": 9.936516516516518e-06,
"loss": 0.506,
"step": 3675
},
{
"epoch": 0.15,
"learning_rate": 9.936016016016017e-06,
"loss": 0.483,
"step": 3700
},
{
"epoch": 0.15,
"learning_rate": 9.935515515515517e-06,
"loss": 0.4931,
"step": 3725
},
{
"epoch": 0.15,
"learning_rate": 9.935015015015016e-06,
"loss": 0.4854,
"step": 3750
},
{
"epoch": 0.15,
"learning_rate": 9.934514514514515e-06,
"loss": 0.4697,
"step": 3775
},
{
"epoch": 0.15,
"learning_rate": 9.934014014014014e-06,
"loss": 0.5078,
"step": 3800
},
{
"epoch": 0.15,
"learning_rate": 9.933513513513514e-06,
"loss": 0.4759,
"step": 3825
},
{
"epoch": 0.15,
"learning_rate": 9.933013013013015e-06,
"loss": 0.5202,
"step": 3850
},
{
"epoch": 0.15,
"learning_rate": 9.932512512512514e-06,
"loss": 0.4633,
"step": 3875
},
{
"epoch": 0.16,
"learning_rate": 9.932012012012013e-06,
"loss": 0.4947,
"step": 3900
},
{
"epoch": 0.16,
"learning_rate": 9.931511511511513e-06,
"loss": 0.4952,
"step": 3925
},
{
"epoch": 0.16,
"learning_rate": 9.931011011011012e-06,
"loss": 0.4768,
"step": 3950
},
{
"epoch": 0.16,
"learning_rate": 9.930510510510511e-06,
"loss": 0.485,
"step": 3975
},
{
"epoch": 0.16,
"learning_rate": 9.93001001001001e-06,
"loss": 0.4855,
"step": 4000
},
{
"epoch": 0.16,
"eval_loss": 0.6402216553688049,
"eval_runtime": 2763.3301,
"eval_samples_per_second": 5.867,
"eval_steps_per_second": 0.147,
"eval_wer": 41.90377810840188,
"step": 4000
},
{
"epoch": 0.16,
"learning_rate": 9.92950950950951e-06,
"loss": 0.4653,
"step": 4025
},
{
"epoch": 0.16,
"learning_rate": 9.929009009009009e-06,
"loss": 0.4994,
"step": 4050
},
{
"epoch": 0.16,
"learning_rate": 9.92850850850851e-06,
"loss": 0.4641,
"step": 4075
},
{
"epoch": 0.16,
"learning_rate": 9.92800800800801e-06,
"loss": 0.4851,
"step": 4100
},
{
"epoch": 0.16,
"learning_rate": 9.927507507507507e-06,
"loss": 0.489,
"step": 4125
},
{
"epoch": 0.17,
"learning_rate": 9.927007007007008e-06,
"loss": 0.4881,
"step": 4150
},
{
"epoch": 0.17,
"learning_rate": 9.926506506506507e-06,
"loss": 0.4975,
"step": 4175
},
{
"epoch": 0.17,
"learning_rate": 9.926006006006007e-06,
"loss": 0.4785,
"step": 4200
},
{
"epoch": 0.17,
"learning_rate": 9.925505505505506e-06,
"loss": 0.4689,
"step": 4225
},
{
"epoch": 0.17,
"learning_rate": 9.925005005005007e-06,
"loss": 0.4688,
"step": 4250
},
{
"epoch": 0.17,
"learning_rate": 9.924504504504505e-06,
"loss": 0.4842,
"step": 4275
},
{
"epoch": 0.17,
"learning_rate": 9.924004004004006e-06,
"loss": 0.462,
"step": 4300
},
{
"epoch": 0.17,
"learning_rate": 9.923503503503505e-06,
"loss": 0.4674,
"step": 4325
},
{
"epoch": 0.17,
"learning_rate": 9.923003003003004e-06,
"loss": 0.4632,
"step": 4350
},
{
"epoch": 0.17,
"learning_rate": 9.922502502502503e-06,
"loss": 0.4618,
"step": 4375
},
{
"epoch": 0.18,
"learning_rate": 9.922002002002003e-06,
"loss": 0.4655,
"step": 4400
},
{
"epoch": 0.18,
"learning_rate": 9.921501501501502e-06,
"loss": 0.4557,
"step": 4425
},
{
"epoch": 0.18,
"learning_rate": 9.921001001001001e-06,
"loss": 0.4549,
"step": 4450
},
{
"epoch": 0.18,
"learning_rate": 9.920500500500502e-06,
"loss": 0.4757,
"step": 4475
},
{
"epoch": 0.18,
"learning_rate": 9.920000000000002e-06,
"loss": 0.4501,
"step": 4500
},
{
"epoch": 0.18,
"learning_rate": 9.919499499499501e-06,
"loss": 0.4789,
"step": 4525
},
{
"epoch": 0.18,
"learning_rate": 9.918998998999e-06,
"loss": 0.4768,
"step": 4550
},
{
"epoch": 0.18,
"learning_rate": 9.9184984984985e-06,
"loss": 0.4799,
"step": 4575
},
{
"epoch": 0.18,
"learning_rate": 9.917997997997999e-06,
"loss": 0.4648,
"step": 4600
},
{
"epoch": 0.18,
"learning_rate": 9.917497497497498e-06,
"loss": 0.4671,
"step": 4625
},
{
"epoch": 0.19,
"learning_rate": 9.916996996996997e-06,
"loss": 0.4672,
"step": 4650
},
{
"epoch": 0.19,
"learning_rate": 9.916496496496497e-06,
"loss": 0.4664,
"step": 4675
},
{
"epoch": 0.19,
"learning_rate": 9.915995995995998e-06,
"loss": 0.4769,
"step": 4700
},
{
"epoch": 0.19,
"learning_rate": 9.915495495495497e-06,
"loss": 0.4828,
"step": 4725
},
{
"epoch": 0.19,
"learning_rate": 9.914994994994995e-06,
"loss": 0.4648,
"step": 4750
},
{
"epoch": 0.19,
"learning_rate": 9.914494494494496e-06,
"loss": 0.4501,
"step": 4775
},
{
"epoch": 0.19,
"learning_rate": 9.913993993993995e-06,
"loss": 0.4638,
"step": 4800
},
{
"epoch": 0.19,
"learning_rate": 9.913493493493494e-06,
"loss": 0.463,
"step": 4825
},
{
"epoch": 0.19,
"learning_rate": 9.912992992992993e-06,
"loss": 0.4759,
"step": 4850
},
{
"epoch": 0.19,
"learning_rate": 9.912492492492494e-06,
"loss": 0.4967,
"step": 4875
},
{
"epoch": 0.2,
"learning_rate": 9.911991991991992e-06,
"loss": 0.4483,
"step": 4900
},
{
"epoch": 0.2,
"learning_rate": 9.911491491491493e-06,
"loss": 0.4514,
"step": 4925
},
{
"epoch": 0.2,
"learning_rate": 9.910990990990992e-06,
"loss": 0.482,
"step": 4950
},
{
"epoch": 0.2,
"learning_rate": 9.910490490490492e-06,
"loss": 0.4439,
"step": 4975
},
{
"epoch": 0.2,
"learning_rate": 9.909989989989991e-06,
"loss": 0.4379,
"step": 5000
},
{
"epoch": 0.2,
"eval_loss": 0.6058462858200073,
"eval_runtime": 2619.0085,
"eval_samples_per_second": 6.191,
"eval_steps_per_second": 0.155,
"eval_wer": 38.43171113389505,
"step": 5000
},
{
"epoch": 0.2,
"learning_rate": 9.90948948948949e-06,
"loss": 0.4567,
"step": 5025
},
{
"epoch": 0.2,
"learning_rate": 9.90898898898899e-06,
"loss": 0.4506,
"step": 5050
},
{
"epoch": 0.2,
"learning_rate": 9.908488488488489e-06,
"loss": 0.4717,
"step": 5075
},
{
"epoch": 0.2,
"learning_rate": 9.90798798798799e-06,
"loss": 0.4775,
"step": 5100
},
{
"epoch": 0.2,
"learning_rate": 9.907487487487487e-06,
"loss": 0.4344,
"step": 5125
},
{
"epoch": 0.21,
"learning_rate": 9.906986986986987e-06,
"loss": 0.4462,
"step": 5150
},
{
"epoch": 0.21,
"learning_rate": 9.906486486486488e-06,
"loss": 0.4492,
"step": 5175
},
{
"epoch": 0.21,
"learning_rate": 9.905985985985987e-06,
"loss": 0.4532,
"step": 5200
},
{
"epoch": 0.21,
"learning_rate": 9.905485485485486e-06,
"loss": 0.4595,
"step": 5225
},
{
"epoch": 0.21,
"learning_rate": 9.904984984984986e-06,
"loss": 0.4369,
"step": 5250
},
{
"epoch": 0.21,
"learning_rate": 9.904484484484485e-06,
"loss": 0.4668,
"step": 5275
},
{
"epoch": 0.21,
"learning_rate": 9.903983983983984e-06,
"loss": 0.4507,
"step": 5300
},
{
"epoch": 0.21,
"learning_rate": 9.903483483483485e-06,
"loss": 0.4438,
"step": 5325
},
{
"epoch": 0.21,
"learning_rate": 9.902982982982984e-06,
"loss": 0.4679,
"step": 5350
},
{
"epoch": 0.21,
"learning_rate": 9.902482482482482e-06,
"loss": 0.468,
"step": 5375
},
{
"epoch": 0.22,
"learning_rate": 9.901981981981983e-06,
"loss": 0.4502,
"step": 5400
},
{
"epoch": 0.22,
"learning_rate": 9.901481481481482e-06,
"loss": 0.4319,
"step": 5425
},
{
"epoch": 0.22,
"learning_rate": 9.900980980980982e-06,
"loss": 0.4799,
"step": 5450
},
{
"epoch": 0.22,
"learning_rate": 9.900480480480481e-06,
"loss": 0.4553,
"step": 5475
},
{
"epoch": 0.22,
"learning_rate": 9.899979979979982e-06,
"loss": 0.4309,
"step": 5500
},
{
"epoch": 0.22,
"learning_rate": 9.89947947947948e-06,
"loss": 0.4385,
"step": 5525
},
{
"epoch": 0.22,
"learning_rate": 9.89897897897898e-06,
"loss": 0.431,
"step": 5550
},
{
"epoch": 0.22,
"learning_rate": 9.89847847847848e-06,
"loss": 0.4478,
"step": 5575
},
{
"epoch": 0.22,
"learning_rate": 9.897977977977979e-06,
"loss": 0.4379,
"step": 5600
},
{
"epoch": 0.22,
"learning_rate": 9.897477477477478e-06,
"loss": 0.4334,
"step": 5625
},
{
"epoch": 0.23,
"learning_rate": 9.896976976976978e-06,
"loss": 0.4542,
"step": 5650
},
{
"epoch": 0.23,
"learning_rate": 9.896476476476477e-06,
"loss": 0.4454,
"step": 5675
},
{
"epoch": 0.23,
"learning_rate": 9.895975975975976e-06,
"loss": 0.4519,
"step": 5700
},
{
"epoch": 0.23,
"learning_rate": 9.895475475475477e-06,
"loss": 0.4625,
"step": 5725
},
{
"epoch": 0.23,
"learning_rate": 9.894974974974975e-06,
"loss": 0.4361,
"step": 5750
},
{
"epoch": 0.23,
"learning_rate": 9.894474474474474e-06,
"loss": 0.4305,
"step": 5775
},
{
"epoch": 0.23,
"learning_rate": 9.893973973973975e-06,
"loss": 0.4558,
"step": 5800
},
{
"epoch": 0.23,
"learning_rate": 9.893473473473475e-06,
"loss": 0.4554,
"step": 5825
},
{
"epoch": 0.23,
"learning_rate": 9.892972972972974e-06,
"loss": 0.4562,
"step": 5850
},
{
"epoch": 0.23,
"learning_rate": 9.892472472472473e-06,
"loss": 0.4378,
"step": 5875
},
{
"epoch": 0.24,
"learning_rate": 9.891971971971972e-06,
"loss": 0.464,
"step": 5900
},
{
"epoch": 0.24,
"learning_rate": 9.891471471471472e-06,
"loss": 0.4279,
"step": 5925
},
{
"epoch": 0.24,
"learning_rate": 9.890970970970973e-06,
"loss": 0.4414,
"step": 5950
},
{
"epoch": 0.24,
"learning_rate": 9.890470470470472e-06,
"loss": 0.4537,
"step": 5975
},
{
"epoch": 0.24,
"learning_rate": 9.88996996996997e-06,
"loss": 0.4399,
"step": 6000
},
{
"epoch": 0.24,
"eval_loss": 0.5941766500473022,
"eval_runtime": 2644.5549,
"eval_samples_per_second": 6.131,
"eval_steps_per_second": 0.154,
"eval_wer": 37.588362716907824,
"step": 6000
},
{
"epoch": 0.24,
"learning_rate": 9.88946946946947e-06,
"loss": 0.4419,
"step": 6025
},
{
"epoch": 0.24,
"learning_rate": 9.88896896896897e-06,
"loss": 0.4219,
"step": 6050
},
{
"epoch": 0.24,
"learning_rate": 9.88846846846847e-06,
"loss": 0.4271,
"step": 6075
},
{
"epoch": 0.24,
"learning_rate": 9.887967967967968e-06,
"loss": 0.4565,
"step": 6100
},
{
"epoch": 0.24,
"learning_rate": 9.88746746746747e-06,
"loss": 0.4588,
"step": 6125
},
{
"epoch": 0.25,
"learning_rate": 9.886966966966967e-06,
"loss": 0.4384,
"step": 6150
},
{
"epoch": 0.25,
"learning_rate": 9.886466466466468e-06,
"loss": 0.4341,
"step": 6175
},
{
"epoch": 0.25,
"learning_rate": 9.885965965965967e-06,
"loss": 0.4302,
"step": 6200
},
{
"epoch": 0.25,
"learning_rate": 9.885465465465467e-06,
"loss": 0.4307,
"step": 6225
},
{
"epoch": 0.25,
"learning_rate": 9.884964964964966e-06,
"loss": 0.4634,
"step": 6250
},
{
"epoch": 0.25,
"learning_rate": 9.884464464464465e-06,
"loss": 0.4374,
"step": 6275
},
{
"epoch": 0.25,
"learning_rate": 9.883963963963965e-06,
"loss": 0.4352,
"step": 6300
},
{
"epoch": 0.25,
"learning_rate": 9.883463463463464e-06,
"loss": 0.4376,
"step": 6325
},
{
"epoch": 0.25,
"learning_rate": 9.882962962962965e-06,
"loss": 0.4284,
"step": 6350
},
{
"epoch": 0.25,
"learning_rate": 9.882462462462462e-06,
"loss": 0.4143,
"step": 6375
},
{
"epoch": 0.26,
"learning_rate": 9.881961961961962e-06,
"loss": 0.4286,
"step": 6400
},
{
"epoch": 0.26,
"learning_rate": 9.881461461461463e-06,
"loss": 0.4358,
"step": 6425
},
{
"epoch": 0.26,
"learning_rate": 9.880960960960962e-06,
"loss": 0.4306,
"step": 6450
},
{
"epoch": 0.26,
"learning_rate": 9.880460460460461e-06,
"loss": 0.4357,
"step": 6475
},
{
"epoch": 0.26,
"learning_rate": 9.87995995995996e-06,
"loss": 0.4344,
"step": 6500
},
{
"epoch": 0.26,
"learning_rate": 9.87945945945946e-06,
"loss": 0.4508,
"step": 6525
},
{
"epoch": 0.26,
"learning_rate": 9.87895895895896e-06,
"loss": 0.441,
"step": 6550
},
{
"epoch": 0.26,
"learning_rate": 9.87845845845846e-06,
"loss": 0.419,
"step": 6575
},
{
"epoch": 0.26,
"learning_rate": 9.87795795795796e-06,
"loss": 0.4221,
"step": 6600
},
{
"epoch": 0.26,
"learning_rate": 9.877457457457457e-06,
"loss": 0.4288,
"step": 6625
},
{
"epoch": 0.27,
"learning_rate": 9.876956956956958e-06,
"loss": 0.4288,
"step": 6650
},
{
"epoch": 0.27,
"learning_rate": 9.876456456456457e-06,
"loss": 0.4314,
"step": 6675
},
{
"epoch": 0.27,
"learning_rate": 9.875955955955957e-06,
"loss": 0.4138,
"step": 6700
},
{
"epoch": 0.27,
"learning_rate": 9.875455455455456e-06,
"loss": 0.4291,
"step": 6725
},
{
"epoch": 0.27,
"learning_rate": 9.874954954954957e-06,
"loss": 0.4446,
"step": 6750
},
{
"epoch": 0.27,
"learning_rate": 9.874454454454455e-06,
"loss": 0.4153,
"step": 6775
},
{
"epoch": 0.27,
"learning_rate": 9.873953953953956e-06,
"loss": 0.4325,
"step": 6800
},
{
"epoch": 0.27,
"learning_rate": 9.873453453453455e-06,
"loss": 0.4158,
"step": 6825
},
{
"epoch": 0.27,
"learning_rate": 9.872952952952952e-06,
"loss": 0.4248,
"step": 6850
},
{
"epoch": 0.27,
"learning_rate": 9.872452452452453e-06,
"loss": 0.4221,
"step": 6875
},
{
"epoch": 0.28,
"learning_rate": 9.871951951951953e-06,
"loss": 0.4206,
"step": 6900
},
{
"epoch": 0.28,
"learning_rate": 9.871451451451452e-06,
"loss": 0.4173,
"step": 6925
},
{
"epoch": 0.28,
"learning_rate": 9.870950950950951e-06,
"loss": 0.4285,
"step": 6950
},
{
"epoch": 0.28,
"learning_rate": 9.870450450450452e-06,
"loss": 0.4102,
"step": 6975
},
{
"epoch": 0.28,
"learning_rate": 9.86994994994995e-06,
"loss": 0.4335,
"step": 7000
},
{
"epoch": 0.28,
"eval_loss": 0.5607422590255737,
"eval_runtime": 2701.8903,
"eval_samples_per_second": 6.001,
"eval_steps_per_second": 0.15,
"eval_wer": 36.83443698398872,
"step": 7000
},
{
"epoch": 0.28,
"learning_rate": 9.86944944944945e-06,
"loss": 0.4267,
"step": 7025
},
{
"epoch": 0.28,
"learning_rate": 9.86894894894895e-06,
"loss": 0.439,
"step": 7050
},
{
"epoch": 0.28,
"learning_rate": 9.86844844844845e-06,
"loss": 0.4139,
"step": 7075
},
{
"epoch": 0.28,
"learning_rate": 9.867947947947949e-06,
"loss": 0.4248,
"step": 7100
},
{
"epoch": 0.28,
"learning_rate": 9.867447447447448e-06,
"loss": 0.4279,
"step": 7125
},
{
"epoch": 0.29,
"learning_rate": 9.866946946946947e-06,
"loss": 0.4172,
"step": 7150
},
{
"epoch": 0.29,
"learning_rate": 9.866446446446447e-06,
"loss": 0.4382,
"step": 7175
},
{
"epoch": 0.29,
"learning_rate": 9.865945945945948e-06,
"loss": 0.4367,
"step": 7200
},
{
"epoch": 0.29,
"learning_rate": 9.865445445445447e-06,
"loss": 0.4247,
"step": 7225
},
{
"epoch": 0.29,
"learning_rate": 9.864944944944945e-06,
"loss": 0.4223,
"step": 7250
},
{
"epoch": 0.29,
"learning_rate": 9.864444444444446e-06,
"loss": 0.4207,
"step": 7275
},
{
"epoch": 0.29,
"learning_rate": 9.863943943943945e-06,
"loss": 0.4166,
"step": 7300
},
{
"epoch": 0.29,
"learning_rate": 9.863443443443444e-06,
"loss": 0.4155,
"step": 7325
},
{
"epoch": 0.29,
"learning_rate": 9.862942942942944e-06,
"loss": 0.4131,
"step": 7350
},
{
"epoch": 0.29,
"learning_rate": 9.862442442442443e-06,
"loss": 0.4,
"step": 7375
},
{
"epoch": 0.3,
"learning_rate": 9.861941941941942e-06,
"loss": 0.4051,
"step": 7400
},
{
"epoch": 0.3,
"learning_rate": 9.861441441441443e-06,
"loss": 0.3976,
"step": 7425
},
{
"epoch": 0.3,
"learning_rate": 9.860940940940942e-06,
"loss": 0.4396,
"step": 7450
},
{
"epoch": 0.3,
"learning_rate": 9.86044044044044e-06,
"loss": 0.3999,
"step": 7475
},
{
"epoch": 0.3,
"learning_rate": 9.859939939939941e-06,
"loss": 0.4167,
"step": 7500
},
{
"epoch": 0.3,
"learning_rate": 9.85943943943944e-06,
"loss": 0.4324,
"step": 7525
},
{
"epoch": 0.3,
"learning_rate": 9.85893893893894e-06,
"loss": 0.4185,
"step": 7550
},
{
"epoch": 0.3,
"learning_rate": 9.858438438438439e-06,
"loss": 0.4205,
"step": 7575
},
{
"epoch": 0.3,
"learning_rate": 9.85793793793794e-06,
"loss": 0.4011,
"step": 7600
},
{
"epoch": 0.3,
"learning_rate": 9.857437437437437e-06,
"loss": 0.4032,
"step": 7625
},
{
"epoch": 0.31,
"learning_rate": 9.856936936936937e-06,
"loss": 0.4223,
"step": 7650
},
{
"epoch": 0.31,
"learning_rate": 9.856436436436438e-06,
"loss": 0.4024,
"step": 7675
},
{
"epoch": 0.31,
"learning_rate": 9.855935935935937e-06,
"loss": 0.4071,
"step": 7700
},
{
"epoch": 0.31,
"learning_rate": 9.855435435435436e-06,
"loss": 0.4024,
"step": 7725
},
{
"epoch": 0.31,
"learning_rate": 9.854934934934936e-06,
"loss": 0.3904,
"step": 7750
},
{
"epoch": 0.31,
"learning_rate": 9.854434434434435e-06,
"loss": 0.4041,
"step": 7775
},
{
"epoch": 0.31,
"learning_rate": 9.853933933933934e-06,
"loss": 0.4201,
"step": 7800
},
{
"epoch": 0.31,
"learning_rate": 9.853433433433435e-06,
"loss": 0.393,
"step": 7825
},
{
"epoch": 0.31,
"learning_rate": 9.852932932932935e-06,
"loss": 0.4405,
"step": 7850
},
{
"epoch": 0.31,
"learning_rate": 9.852432432432432e-06,
"loss": 0.402,
"step": 7875
},
{
"epoch": 0.32,
"learning_rate": 9.851931931931933e-06,
"loss": 0.4064,
"step": 7900
},
{
"epoch": 0.32,
"learning_rate": 9.851431431431432e-06,
"loss": 0.3908,
"step": 7925
},
{
"epoch": 0.32,
"learning_rate": 9.850930930930932e-06,
"loss": 0.4232,
"step": 7950
},
{
"epoch": 0.32,
"learning_rate": 9.850430430430431e-06,
"loss": 0.4311,
"step": 7975
},
{
"epoch": 0.32,
"learning_rate": 9.84992992992993e-06,
"loss": 0.4266,
"step": 8000
},
{
"epoch": 0.32,
"eval_loss": 0.5630306601524353,
"eval_runtime": 2643.0014,
"eval_samples_per_second": 6.134,
"eval_steps_per_second": 0.154,
"eval_wer": 34.73531656401045,
"step": 8000
},
{
"epoch": 0.32,
"learning_rate": 9.84942942942943e-06,
"loss": 0.4117,
"step": 8025
},
{
"epoch": 0.32,
"learning_rate": 9.84894894894895e-06,
"loss": 0.3983,
"step": 8050
},
{
"epoch": 0.32,
"learning_rate": 9.848448448448448e-06,
"loss": 0.4025,
"step": 8075
},
{
"epoch": 0.32,
"learning_rate": 9.847947947947949e-06,
"loss": 0.4119,
"step": 8100
},
{
"epoch": 0.32,
"learning_rate": 9.847447447447448e-06,
"loss": 0.4135,
"step": 8125
},
{
"epoch": 0.33,
"learning_rate": 9.846946946946948e-06,
"loss": 0.4048,
"step": 8150
},
{
"epoch": 0.33,
"learning_rate": 9.846446446446447e-06,
"loss": 0.4371,
"step": 8175
},
{
"epoch": 0.33,
"learning_rate": 9.845945945945948e-06,
"loss": 0.3954,
"step": 8200
},
{
"epoch": 0.33,
"learning_rate": 9.845445445445446e-06,
"loss": 0.3933,
"step": 8225
},
{
"epoch": 0.33,
"learning_rate": 9.844944944944945e-06,
"loss": 0.3956,
"step": 8250
},
{
"epoch": 0.33,
"learning_rate": 9.844444444444446e-06,
"loss": 0.4109,
"step": 8275
},
{
"epoch": 0.33,
"learning_rate": 9.843943943943945e-06,
"loss": 0.4087,
"step": 8300
},
{
"epoch": 0.33,
"learning_rate": 9.843443443443444e-06,
"loss": 0.3904,
"step": 8325
},
{
"epoch": 0.33,
"learning_rate": 9.842942942942944e-06,
"loss": 0.4309,
"step": 8350
},
{
"epoch": 0.33,
"learning_rate": 9.842442442442443e-06,
"loss": 0.411,
"step": 8375
},
{
"epoch": 0.33,
"learning_rate": 9.841941941941942e-06,
"loss": 0.384,
"step": 8400
},
{
"epoch": 0.34,
"learning_rate": 9.841441441441443e-06,
"loss": 0.3993,
"step": 8425
},
{
"epoch": 0.34,
"learning_rate": 9.840940940940943e-06,
"loss": 0.3931,
"step": 8450
},
{
"epoch": 0.34,
"learning_rate": 9.84044044044044e-06,
"loss": 0.4044,
"step": 8475
},
{
"epoch": 0.34,
"learning_rate": 9.839939939939941e-06,
"loss": 0.3985,
"step": 8500
},
{
"epoch": 0.34,
"learning_rate": 9.83943943943944e-06,
"loss": 0.4317,
"step": 8525
},
{
"epoch": 0.34,
"learning_rate": 9.83893893893894e-06,
"loss": 0.3932,
"step": 8550
},
{
"epoch": 0.34,
"learning_rate": 9.838438438438439e-06,
"loss": 0.3925,
"step": 8575
},
{
"epoch": 0.34,
"learning_rate": 9.837937937937938e-06,
"loss": 0.3799,
"step": 8600
},
{
"epoch": 0.34,
"learning_rate": 9.837437437437438e-06,
"loss": 0.3975,
"step": 8625
},
{
"epoch": 0.34,
"learning_rate": 9.836936936936937e-06,
"loss": 0.4047,
"step": 8650
},
{
"epoch": 0.35,
"learning_rate": 9.836436436436438e-06,
"loss": 0.4092,
"step": 8675
},
{
"epoch": 0.35,
"learning_rate": 9.835935935935936e-06,
"loss": 0.3945,
"step": 8700
},
{
"epoch": 0.35,
"learning_rate": 9.835435435435437e-06,
"loss": 0.4068,
"step": 8725
},
{
"epoch": 0.35,
"learning_rate": 9.834934934934936e-06,
"loss": 0.3877,
"step": 8750
},
{
"epoch": 0.35,
"learning_rate": 9.834434434434435e-06,
"loss": 0.3949,
"step": 8775
},
{
"epoch": 0.35,
"learning_rate": 9.833933933933934e-06,
"loss": 0.3841,
"step": 8800
},
{
"epoch": 0.35,
"learning_rate": 9.833433433433435e-06,
"loss": 0.4074,
"step": 8825
},
{
"epoch": 0.35,
"learning_rate": 9.832932932932933e-06,
"loss": 0.4171,
"step": 8850
},
{
"epoch": 0.35,
"learning_rate": 9.832452452452454e-06,
"loss": 0.3953,
"step": 8875
},
{
"epoch": 0.35,
"learning_rate": 9.831951951951953e-06,
"loss": 0.3761,
"step": 8900
},
{
"epoch": 0.36,
"learning_rate": 9.831451451451452e-06,
"loss": 0.4115,
"step": 8925
},
{
"epoch": 0.36,
"learning_rate": 9.830950950950952e-06,
"loss": 0.3979,
"step": 8950
},
{
"epoch": 0.36,
"learning_rate": 9.830450450450451e-06,
"loss": 0.405,
"step": 8975
},
{
"epoch": 0.36,
"learning_rate": 9.82994994994995e-06,
"loss": 0.4057,
"step": 9000
},
{
"epoch": 0.36,
"eval_loss": 0.5405702590942383,
"eval_runtime": 2698.8083,
"eval_samples_per_second": 6.007,
"eval_steps_per_second": 0.15,
"eval_wer": 34.710648237370975,
"step": 9000
},
{
"epoch": 0.36,
"learning_rate": 9.829449449449451e-06,
"loss": 0.3833,
"step": 9025
},
{
"epoch": 0.36,
"learning_rate": 9.82894894894895e-06,
"loss": 0.4058,
"step": 9050
},
{
"epoch": 0.36,
"learning_rate": 9.828448448448448e-06,
"loss": 0.3861,
"step": 9075
},
{
"epoch": 0.36,
"learning_rate": 9.82794794794795e-06,
"loss": 0.4031,
"step": 9100
},
{
"epoch": 0.36,
"learning_rate": 9.827447447447449e-06,
"loss": 0.3894,
"step": 9125
},
{
"epoch": 0.36,
"learning_rate": 9.826946946946948e-06,
"loss": 0.3892,
"step": 9150
},
{
"epoch": 0.37,
"learning_rate": 9.826446446446447e-06,
"loss": 0.3991,
"step": 9175
},
{
"epoch": 0.37,
"learning_rate": 9.825945945945946e-06,
"loss": 0.3803,
"step": 9200
},
{
"epoch": 0.37,
"learning_rate": 9.825445445445446e-06,
"loss": 0.3927,
"step": 9225
},
{
"epoch": 0.37,
"learning_rate": 9.824944944944945e-06,
"loss": 0.4084,
"step": 9250
},
{
"epoch": 0.37,
"learning_rate": 9.824444444444446e-06,
"loss": 0.3916,
"step": 9275
},
{
"epoch": 0.37,
"learning_rate": 9.823943943943944e-06,
"loss": 0.3674,
"step": 9300
},
{
"epoch": 0.37,
"learning_rate": 9.823443443443445e-06,
"loss": 0.3683,
"step": 9325
},
{
"epoch": 0.37,
"learning_rate": 9.822942942942944e-06,
"loss": 0.4016,
"step": 9350
},
{
"epoch": 0.37,
"learning_rate": 9.822442442442443e-06,
"loss": 0.395,
"step": 9375
},
{
"epoch": 0.37,
"learning_rate": 9.821941941941942e-06,
"loss": 0.3906,
"step": 9400
},
{
"epoch": 0.38,
"learning_rate": 9.821441441441443e-06,
"loss": 0.3843,
"step": 9425
},
{
"epoch": 0.38,
"learning_rate": 9.820940940940941e-06,
"loss": 0.3732,
"step": 9450
},
{
"epoch": 0.38,
"learning_rate": 9.82044044044044e-06,
"loss": 0.3927,
"step": 9475
},
{
"epoch": 0.38,
"learning_rate": 9.819939939939941e-06,
"loss": 0.4151,
"step": 9500
},
{
"epoch": 0.38,
"learning_rate": 9.81943943943944e-06,
"loss": 0.3933,
"step": 9525
},
{
"epoch": 0.38,
"learning_rate": 9.81893893893894e-06,
"loss": 0.3856,
"step": 9550
},
{
"epoch": 0.38,
"learning_rate": 9.81843843843844e-06,
"loss": 0.3818,
"step": 9575
},
{
"epoch": 0.38,
"learning_rate": 9.817937937937939e-06,
"loss": 0.3932,
"step": 9600
},
{
"epoch": 0.38,
"learning_rate": 9.817437437437438e-06,
"loss": 0.4085,
"step": 9625
},
{
"epoch": 0.38,
"learning_rate": 9.816936936936939e-06,
"loss": 0.4023,
"step": 9650
},
{
"epoch": 0.39,
"learning_rate": 9.816436436436436e-06,
"loss": 0.3918,
"step": 9675
},
{
"epoch": 0.39,
"learning_rate": 9.815935935935936e-06,
"loss": 0.3965,
"step": 9700
},
{
"epoch": 0.39,
"learning_rate": 9.815435435435437e-06,
"loss": 0.3934,
"step": 9725
},
{
"epoch": 0.39,
"learning_rate": 9.814934934934936e-06,
"loss": 0.3807,
"step": 9750
},
{
"epoch": 0.39,
"learning_rate": 9.814434434434435e-06,
"loss": 0.3809,
"step": 9775
},
{
"epoch": 0.39,
"learning_rate": 9.813933933933935e-06,
"loss": 0.3804,
"step": 9800
},
{
"epoch": 0.39,
"learning_rate": 9.813433433433434e-06,
"loss": 0.4112,
"step": 9825
},
{
"epoch": 0.39,
"learning_rate": 9.812932932932933e-06,
"loss": 0.3853,
"step": 9850
},
{
"epoch": 0.39,
"learning_rate": 9.812432432432433e-06,
"loss": 0.3967,
"step": 9875
},
{
"epoch": 0.39,
"learning_rate": 9.811931931931934e-06,
"loss": 0.3934,
"step": 9900
},
{
"epoch": 0.4,
"learning_rate": 9.811431431431431e-06,
"loss": 0.4013,
"step": 9925
},
{
"epoch": 0.4,
"learning_rate": 9.810930930930932e-06,
"loss": 0.4004,
"step": 9950
},
{
"epoch": 0.4,
"learning_rate": 9.810430430430431e-06,
"loss": 0.3825,
"step": 9975
},
{
"epoch": 0.4,
"learning_rate": 9.80992992992993e-06,
"loss": 0.3798,
"step": 10000
},
{
"epoch": 0.4,
"eval_loss": 0.5242385864257812,
"eval_runtime": 2613.1802,
"eval_samples_per_second": 6.204,
"eval_steps_per_second": 0.155,
"eval_wer": 32.9584261607604,
"step": 10000
},
{
"epoch": 0.4,
"learning_rate": 9.80942942942943e-06,
"loss": 0.379,
"step": 10025
},
{
"epoch": 0.4,
"learning_rate": 9.808928928928931e-06,
"loss": 0.397,
"step": 10050
},
{
"epoch": 0.4,
"learning_rate": 9.808428428428429e-06,
"loss": 0.3818,
"step": 10075
},
{
"epoch": 0.4,
"learning_rate": 9.807927927927928e-06,
"loss": 0.373,
"step": 10100
},
{
"epoch": 0.4,
"learning_rate": 9.807427427427429e-06,
"loss": 0.3592,
"step": 10125
},
{
"epoch": 0.4,
"learning_rate": 9.806926926926928e-06,
"loss": 0.3824,
"step": 10150
},
{
"epoch": 0.41,
"learning_rate": 9.806426426426427e-06,
"loss": 0.3907,
"step": 10175
},
{
"epoch": 0.41,
"learning_rate": 9.805925925925927e-06,
"loss": 0.3787,
"step": 10200
},
{
"epoch": 0.41,
"learning_rate": 9.805425425425426e-06,
"loss": 0.3571,
"step": 10225
},
{
"epoch": 0.41,
"learning_rate": 9.804924924924925e-06,
"loss": 0.3785,
"step": 10250
},
{
"epoch": 0.41,
"learning_rate": 9.804424424424426e-06,
"loss": 0.41,
"step": 10275
},
{
"epoch": 0.41,
"learning_rate": 9.803923923923924e-06,
"loss": 0.3703,
"step": 10300
},
{
"epoch": 0.41,
"learning_rate": 9.803423423423423e-06,
"loss": 0.38,
"step": 10325
},
{
"epoch": 0.41,
"learning_rate": 9.802922922922924e-06,
"loss": 0.3787,
"step": 10350
},
{
"epoch": 0.41,
"learning_rate": 9.802422422422424e-06,
"loss": 0.3948,
"step": 10375
},
{
"epoch": 0.41,
"learning_rate": 9.801921921921923e-06,
"loss": 0.3775,
"step": 10400
},
{
"epoch": 0.42,
"learning_rate": 9.801421421421422e-06,
"loss": 0.3823,
"step": 10425
},
{
"epoch": 0.42,
"learning_rate": 9.800920920920921e-06,
"loss": 0.3868,
"step": 10450
},
{
"epoch": 0.42,
"learning_rate": 9.80042042042042e-06,
"loss": 0.378,
"step": 10475
},
{
"epoch": 0.42,
"learning_rate": 9.79991991991992e-06,
"loss": 0.3911,
"step": 10500
},
{
"epoch": 0.42,
"learning_rate": 9.799419419419421e-06,
"loss": 0.3845,
"step": 10525
},
{
"epoch": 0.42,
"learning_rate": 9.798918918918919e-06,
"loss": 0.3899,
"step": 10550
},
{
"epoch": 0.42,
"learning_rate": 9.79841841841842e-06,
"loss": 0.3919,
"step": 10575
},
{
"epoch": 0.42,
"learning_rate": 9.797917917917919e-06,
"loss": 0.4163,
"step": 10600
},
{
"epoch": 0.42,
"learning_rate": 9.797417417417418e-06,
"loss": 0.382,
"step": 10625
},
{
"epoch": 0.42,
"learning_rate": 9.796916916916918e-06,
"loss": 0.3796,
"step": 10650
},
{
"epoch": 0.43,
"learning_rate": 9.796416416416419e-06,
"loss": 0.3751,
"step": 10675
},
{
"epoch": 0.43,
"learning_rate": 9.795915915915916e-06,
"loss": 0.3768,
"step": 10700
},
{
"epoch": 0.43,
"learning_rate": 9.795415415415415e-06,
"loss": 0.3878,
"step": 10725
},
{
"epoch": 0.43,
"learning_rate": 9.794914914914916e-06,
"loss": 0.3821,
"step": 10750
},
{
"epoch": 0.43,
"learning_rate": 9.794414414414416e-06,
"loss": 0.3879,
"step": 10775
},
{
"epoch": 0.43,
"learning_rate": 9.793913913913915e-06,
"loss": 0.3685,
"step": 10800
},
{
"epoch": 0.43,
"learning_rate": 9.793413413413414e-06,
"loss": 0.3673,
"step": 10825
},
{
"epoch": 0.43,
"learning_rate": 9.792912912912914e-06,
"loss": 0.3955,
"step": 10850
},
{
"epoch": 0.43,
"learning_rate": 9.792412412412413e-06,
"loss": 0.3616,
"step": 10875
},
{
"epoch": 0.43,
"learning_rate": 9.791911911911914e-06,
"loss": 0.3692,
"step": 10900
},
{
"epoch": 0.44,
"learning_rate": 9.791411411411411e-06,
"loss": 0.3766,
"step": 10925
},
{
"epoch": 0.44,
"learning_rate": 9.79091091091091e-06,
"loss": 0.3873,
"step": 10950
},
{
"epoch": 0.44,
"learning_rate": 9.790410410410412e-06,
"loss": 0.3792,
"step": 10975
},
{
"epoch": 0.44,
"learning_rate": 9.789909909909911e-06,
"loss": 0.3781,
"step": 11000
},
{
"epoch": 0.44,
"eval_loss": 0.5272489190101624,
"eval_runtime": 2804.5214,
"eval_samples_per_second": 5.781,
"eval_steps_per_second": 0.145,
"eval_wer": 34.24349180163582,
"step": 11000
},
{
"epoch": 0.44,
"learning_rate": 9.78940940940941e-06,
"loss": 0.3926,
"step": 11025
},
{
"epoch": 0.44,
"learning_rate": 9.78890890890891e-06,
"loss": 0.3849,
"step": 11050
},
{
"epoch": 0.44,
"learning_rate": 9.788408408408409e-06,
"loss": 0.3726,
"step": 11075
},
{
"epoch": 0.44,
"learning_rate": 9.787907907907908e-06,
"loss": 0.3798,
"step": 11100
},
{
"epoch": 0.44,
"learning_rate": 9.787407407407408e-06,
"loss": 0.3877,
"step": 11125
},
{
"epoch": 0.44,
"learning_rate": 9.786906906906909e-06,
"loss": 0.3873,
"step": 11150
},
{
"epoch": 0.45,
"learning_rate": 9.786426426426428e-06,
"loss": 0.381,
"step": 11175
},
{
"epoch": 0.45,
"learning_rate": 9.785925925925927e-06,
"loss": 0.3769,
"step": 11200
},
{
"epoch": 0.45,
"learning_rate": 9.785425425425426e-06,
"loss": 0.3903,
"step": 11225
},
{
"epoch": 0.45,
"learning_rate": 9.784924924924926e-06,
"loss": 0.3778,
"step": 11250
},
{
"epoch": 0.45,
"learning_rate": 9.784424424424427e-06,
"loss": 0.3966,
"step": 11275
},
{
"epoch": 0.45,
"learning_rate": 9.783923923923924e-06,
"loss": 0.3851,
"step": 11300
},
{
"epoch": 0.45,
"learning_rate": 9.783423423423423e-06,
"loss": 0.3737,
"step": 11325
},
{
"epoch": 0.45,
"learning_rate": 9.782922922922924e-06,
"loss": 0.3602,
"step": 11350
},
{
"epoch": 0.45,
"learning_rate": 9.782422422422424e-06,
"loss": 0.3722,
"step": 11375
},
{
"epoch": 0.45,
"learning_rate": 9.781921921921923e-06,
"loss": 0.3874,
"step": 11400
},
{
"epoch": 0.46,
"learning_rate": 9.781421421421422e-06,
"loss": 0.3895,
"step": 11425
},
{
"epoch": 0.46,
"learning_rate": 9.780920920920922e-06,
"loss": 0.375,
"step": 11450
},
{
"epoch": 0.46,
"learning_rate": 9.780420420420421e-06,
"loss": 0.3858,
"step": 11475
},
{
"epoch": 0.46,
"learning_rate": 9.77991991991992e-06,
"loss": 0.3877,
"step": 11500
},
{
"epoch": 0.46,
"learning_rate": 9.77941941941942e-06,
"loss": 0.3932,
"step": 11525
},
{
"epoch": 0.46,
"learning_rate": 9.778918918918919e-06,
"loss": 0.3792,
"step": 11550
},
{
"epoch": 0.46,
"learning_rate": 9.77841841841842e-06,
"loss": 0.3709,
"step": 11575
},
{
"epoch": 0.46,
"learning_rate": 9.777917917917919e-06,
"loss": 0.3815,
"step": 11600
},
{
"epoch": 0.46,
"learning_rate": 9.777417417417418e-06,
"loss": 0.3834,
"step": 11625
},
{
"epoch": 0.46,
"learning_rate": 9.776916916916918e-06,
"loss": 0.3598,
"step": 11650
},
{
"epoch": 0.47,
"learning_rate": 9.776416416416417e-06,
"loss": 0.3648,
"step": 11675
},
{
"epoch": 0.47,
"learning_rate": 9.775915915915916e-06,
"loss": 0.3582,
"step": 11700
},
{
"epoch": 0.47,
"learning_rate": 9.775415415415416e-06,
"loss": 0.3753,
"step": 11725
},
{
"epoch": 0.47,
"learning_rate": 9.774914914914917e-06,
"loss": 0.3689,
"step": 11750
},
{
"epoch": 0.47,
"learning_rate": 9.774414414414414e-06,
"loss": 0.3774,
"step": 11775
},
{
"epoch": 0.47,
"learning_rate": 9.773913913913915e-06,
"loss": 0.3825,
"step": 11800
},
{
"epoch": 0.47,
"learning_rate": 9.773413413413414e-06,
"loss": 0.36,
"step": 11825
},
{
"epoch": 0.47,
"learning_rate": 9.772912912912914e-06,
"loss": 0.3672,
"step": 11850
},
{
"epoch": 0.47,
"learning_rate": 9.772412412412413e-06,
"loss": 0.3848,
"step": 11875
},
{
"epoch": 0.47,
"learning_rate": 9.771911911911914e-06,
"loss": 0.357,
"step": 11900
},
{
"epoch": 0.48,
"learning_rate": 9.771411411411412e-06,
"loss": 0.3658,
"step": 11925
},
{
"epoch": 0.48,
"learning_rate": 9.770910910910911e-06,
"loss": 0.3733,
"step": 11950
},
{
"epoch": 0.48,
"learning_rate": 9.770410410410412e-06,
"loss": 0.3731,
"step": 11975
},
{
"epoch": 0.48,
"learning_rate": 9.76990990990991e-06,
"loss": 0.3674,
"step": 12000
},
{
"epoch": 0.48,
"eval_loss": 0.5061578750610352,
"eval_runtime": 2740.8866,
"eval_samples_per_second": 5.915,
"eval_steps_per_second": 0.148,
"eval_wer": 33.014700780906715,
"step": 12000
},
{
"epoch": 0.48,
"learning_rate": 9.76940940940941e-06,
"loss": 0.3981,
"step": 12025
},
{
"epoch": 0.48,
"learning_rate": 9.76890890890891e-06,
"loss": 0.3759,
"step": 12050
},
{
"epoch": 0.48,
"learning_rate": 9.76840840840841e-06,
"loss": 0.3647,
"step": 12075
},
{
"epoch": 0.48,
"learning_rate": 9.767907907907908e-06,
"loss": 0.3756,
"step": 12100
},
{
"epoch": 0.48,
"learning_rate": 9.767407407407408e-06,
"loss": 0.3444,
"step": 12125
},
{
"epoch": 0.48,
"learning_rate": 9.766906906906907e-06,
"loss": 0.3536,
"step": 12150
},
{
"epoch": 0.49,
"learning_rate": 9.766406406406406e-06,
"loss": 0.3584,
"step": 12175
},
{
"epoch": 0.49,
"learning_rate": 9.765905905905907e-06,
"loss": 0.3879,
"step": 12200
},
{
"epoch": 0.49,
"learning_rate": 9.765405405405407e-06,
"loss": 0.3403,
"step": 12225
},
{
"epoch": 0.49,
"learning_rate": 9.764904904904906e-06,
"loss": 0.3646,
"step": 12250
},
{
"epoch": 0.49,
"learning_rate": 9.764404404404405e-06,
"loss": 0.3697,
"step": 12275
},
{
"epoch": 0.49,
"learning_rate": 9.763903903903905e-06,
"loss": 0.3607,
"step": 12300
},
{
"epoch": 0.49,
"learning_rate": 9.763403403403404e-06,
"loss": 0.3588,
"step": 12325
},
{
"epoch": 0.49,
"learning_rate": 9.762902902902903e-06,
"loss": 0.3668,
"step": 12350
},
{
"epoch": 0.49,
"learning_rate": 9.762402402402404e-06,
"loss": 0.3933,
"step": 12375
},
{
"epoch": 0.49,
"learning_rate": 9.761901901901902e-06,
"loss": 0.3744,
"step": 12400
},
{
"epoch": 0.5,
"learning_rate": 9.761401401401403e-06,
"loss": 0.3905,
"step": 12425
},
{
"epoch": 0.5,
"learning_rate": 9.760900900900902e-06,
"loss": 0.3641,
"step": 12450
},
{
"epoch": 0.5,
"learning_rate": 9.760400400400401e-06,
"loss": 0.3647,
"step": 12475
},
{
"epoch": 0.5,
"learning_rate": 9.7598998998999e-06,
"loss": 0.35,
"step": 12500
},
{
"epoch": 0.5,
"learning_rate": 9.7593993993994e-06,
"loss": 0.3545,
"step": 12525
},
{
"epoch": 0.5,
"learning_rate": 9.7588988988989e-06,
"loss": 0.3645,
"step": 12550
},
{
"epoch": 0.5,
"learning_rate": 9.758398398398398e-06,
"loss": 0.3625,
"step": 12575
},
{
"epoch": 0.5,
"learning_rate": 9.7578978978979e-06,
"loss": 0.3801,
"step": 12600
},
{
"epoch": 0.5,
"learning_rate": 9.757397397397397e-06,
"loss": 0.3562,
"step": 12625
},
{
"epoch": 0.5,
"learning_rate": 9.756896896896898e-06,
"loss": 0.3594,
"step": 12650
},
{
"epoch": 0.51,
"learning_rate": 9.756396396396397e-06,
"loss": 0.3644,
"step": 12675
},
{
"epoch": 0.51,
"learning_rate": 9.755895895895897e-06,
"loss": 0.356,
"step": 12700
},
{
"epoch": 0.51,
"learning_rate": 9.755395395395396e-06,
"loss": 0.3676,
"step": 12725
},
{
"epoch": 0.51,
"learning_rate": 9.754894894894895e-06,
"loss": 0.3722,
"step": 12750
},
{
"epoch": 0.51,
"learning_rate": 9.754394394394395e-06,
"loss": 0.396,
"step": 12775
},
{
"epoch": 0.51,
"learning_rate": 9.753893893893894e-06,
"loss": 0.3613,
"step": 12800
},
{
"epoch": 0.51,
"learning_rate": 9.753393393393395e-06,
"loss": 0.3626,
"step": 12825
},
{
"epoch": 0.51,
"learning_rate": 9.752892892892894e-06,
"loss": 0.3642,
"step": 12850
},
{
"epoch": 0.51,
"learning_rate": 9.752392392392393e-06,
"loss": 0.3674,
"step": 12875
},
{
"epoch": 0.51,
"learning_rate": 9.751891891891893e-06,
"loss": 0.3526,
"step": 12900
},
{
"epoch": 0.52,
"learning_rate": 9.751391391391392e-06,
"loss": 0.3767,
"step": 12925
},
{
"epoch": 0.52,
"learning_rate": 9.750890890890891e-06,
"loss": 0.3616,
"step": 12950
},
{
"epoch": 0.52,
"learning_rate": 9.75039039039039e-06,
"loss": 0.3475,
"step": 12975
},
{
"epoch": 0.52,
"learning_rate": 9.749889889889892e-06,
"loss": 0.3507,
"step": 13000
},
{
"epoch": 0.52,
"eval_loss": 0.49944427609443665,
"eval_runtime": 2897.6163,
"eval_samples_per_second": 5.595,
"eval_steps_per_second": 0.14,
"eval_wer": 33.72160251616932,
"step": 13000
},
{
"epoch": 0.52,
"learning_rate": 9.74938938938939e-06,
"loss": 0.3743,
"step": 13025
},
{
"epoch": 0.52,
"learning_rate": 9.74888888888889e-06,
"loss": 0.3597,
"step": 13050
},
{
"epoch": 0.52,
"learning_rate": 9.74838838838839e-06,
"loss": 0.3862,
"step": 13075
},
{
"epoch": 0.52,
"learning_rate": 9.747887887887889e-06,
"loss": 0.3606,
"step": 13100
},
{
"epoch": 0.52,
"learning_rate": 9.747387387387388e-06,
"loss": 0.4099,
"step": 13125
},
{
"epoch": 0.52,
"learning_rate": 9.746886886886887e-06,
"loss": 0.3583,
"step": 13150
},
{
"epoch": 0.53,
"learning_rate": 9.746386386386387e-06,
"loss": 0.3673,
"step": 13175
},
{
"epoch": 0.53,
"learning_rate": 9.745885885885886e-06,
"loss": 0.3597,
"step": 13200
},
{
"epoch": 0.53,
"learning_rate": 9.745385385385387e-06,
"loss": 0.3715,
"step": 13225
},
{
"epoch": 0.53,
"learning_rate": 9.744884884884885e-06,
"loss": 0.3681,
"step": 13250
},
{
"epoch": 0.53,
"learning_rate": 9.744384384384386e-06,
"loss": 0.3793,
"step": 13275
},
{
"epoch": 0.53,
"learning_rate": 9.743883883883885e-06,
"loss": 0.3574,
"step": 13300
},
{
"epoch": 0.53,
"learning_rate": 9.743383383383384e-06,
"loss": 0.3602,
"step": 13325
},
{
"epoch": 0.53,
"learning_rate": 9.742882882882883e-06,
"loss": 0.3663,
"step": 13350
},
{
"epoch": 0.53,
"learning_rate": 9.742382382382383e-06,
"loss": 0.3947,
"step": 13375
},
{
"epoch": 0.53,
"learning_rate": 9.741881881881882e-06,
"loss": 0.3709,
"step": 13400
},
{
"epoch": 0.54,
"learning_rate": 9.741381381381381e-06,
"loss": 0.3625,
"step": 13425
},
{
"epoch": 0.54,
"learning_rate": 9.740880880880882e-06,
"loss": 0.3574,
"step": 13450
},
{
"epoch": 0.54,
"learning_rate": 9.740380380380382e-06,
"loss": 0.3642,
"step": 13475
},
{
"epoch": 0.54,
"learning_rate": 9.739879879879881e-06,
"loss": 0.3639,
"step": 13500
},
{
"epoch": 0.54,
"learning_rate": 9.73937937937938e-06,
"loss": 0.3669,
"step": 13525
},
{
"epoch": 0.54,
"learning_rate": 9.73887887887888e-06,
"loss": 0.3762,
"step": 13550
},
{
"epoch": 0.54,
"learning_rate": 9.738378378378379e-06,
"loss": 0.3564,
"step": 13575
},
{
"epoch": 0.54,
"learning_rate": 9.737877877877878e-06,
"loss": 0.3602,
"step": 13600
},
{
"epoch": 0.54,
"learning_rate": 9.737377377377379e-06,
"loss": 0.3464,
"step": 13625
},
{
"epoch": 0.54,
"learning_rate": 9.736876876876877e-06,
"loss": 0.3618,
"step": 13650
},
{
"epoch": 0.55,
"learning_rate": 9.736376376376378e-06,
"loss": 0.3761,
"step": 13675
},
{
"epoch": 0.55,
"learning_rate": 9.735875875875877e-06,
"loss": 0.3604,
"step": 13700
},
{
"epoch": 0.55,
"learning_rate": 9.735375375375376e-06,
"loss": 0.3714,
"step": 13725
},
{
"epoch": 0.55,
"learning_rate": 9.734874874874876e-06,
"loss": 0.3699,
"step": 13750
},
{
"epoch": 0.55,
"learning_rate": 9.734374374374375e-06,
"loss": 0.3728,
"step": 13775
},
{
"epoch": 0.55,
"learning_rate": 9.733873873873874e-06,
"loss": 0.3878,
"step": 13800
},
{
"epoch": 0.55,
"learning_rate": 9.733373373373374e-06,
"loss": 0.3461,
"step": 13825
},
{
"epoch": 0.55,
"learning_rate": 9.732872872872875e-06,
"loss": 0.3415,
"step": 13850
},
{
"epoch": 0.55,
"learning_rate": 9.732372372372372e-06,
"loss": 0.3548,
"step": 13875
},
{
"epoch": 0.55,
"learning_rate": 9.731871871871873e-06,
"loss": 0.3729,
"step": 13900
},
{
"epoch": 0.56,
"learning_rate": 9.731371371371372e-06,
"loss": 0.3705,
"step": 13925
},
{
"epoch": 0.56,
"learning_rate": 9.730870870870872e-06,
"loss": 0.3605,
"step": 13950
},
{
"epoch": 0.56,
"learning_rate": 9.730370370370371e-06,
"loss": 0.3631,
"step": 13975
},
{
"epoch": 0.56,
"learning_rate": 9.72986986986987e-06,
"loss": 0.375,
"step": 14000
},
{
"epoch": 0.56,
"eval_loss": 0.5072089433670044,
"eval_runtime": 2512.5863,
"eval_samples_per_second": 6.453,
"eval_steps_per_second": 0.162,
"eval_wer": 30.171676135706633,
"step": 14000
},
{
"epoch": 0.56,
"learning_rate": 9.72936936936937e-06,
"loss": 0.3642,
"step": 14025
},
{
"epoch": 0.56,
"learning_rate": 9.728868868868869e-06,
"loss": 0.348,
"step": 14050
},
{
"epoch": 0.56,
"learning_rate": 9.72836836836837e-06,
"loss": 0.3413,
"step": 14075
},
{
"epoch": 0.56,
"learning_rate": 9.72786786786787e-06,
"loss": 0.3528,
"step": 14100
},
{
"epoch": 0.56,
"learning_rate": 9.727367367367368e-06,
"loss": 0.3501,
"step": 14125
},
{
"epoch": 0.56,
"learning_rate": 9.726866866866868e-06,
"loss": 0.3318,
"step": 14150
},
{
"epoch": 0.57,
"learning_rate": 9.726366366366367e-06,
"loss": 0.3655,
"step": 14175
},
{
"epoch": 0.57,
"learning_rate": 9.725865865865866e-06,
"loss": 0.3496,
"step": 14200
},
{
"epoch": 0.57,
"learning_rate": 9.725365365365366e-06,
"loss": 0.3379,
"step": 14225
},
{
"epoch": 0.57,
"learning_rate": 9.724884884884885e-06,
"loss": 0.3893,
"step": 14250
},
{
"epoch": 0.57,
"learning_rate": 9.724384384384386e-06,
"loss": 0.3703,
"step": 14275
},
{
"epoch": 0.57,
"learning_rate": 9.723883883883885e-06,
"loss": 0.3531,
"step": 14300
},
{
"epoch": 0.57,
"learning_rate": 9.723383383383384e-06,
"loss": 0.3604,
"step": 14325
},
{
"epoch": 0.57,
"learning_rate": 9.722882882882884e-06,
"loss": 0.3527,
"step": 14350
},
{
"epoch": 0.57,
"learning_rate": 9.722382382382383e-06,
"loss": 0.3556,
"step": 14375
},
{
"epoch": 0.57,
"learning_rate": 9.721881881881882e-06,
"loss": 0.3664,
"step": 14400
},
{
"epoch": 0.58,
"learning_rate": 9.721381381381382e-06,
"loss": 0.3641,
"step": 14425
},
{
"epoch": 0.58,
"learning_rate": 9.720880880880883e-06,
"loss": 0.3553,
"step": 14450
},
{
"epoch": 0.58,
"learning_rate": 9.72038038038038e-06,
"loss": 0.3605,
"step": 14475
},
{
"epoch": 0.58,
"learning_rate": 9.719879879879881e-06,
"loss": 0.3412,
"step": 14500
},
{
"epoch": 0.58,
"learning_rate": 9.71937937937938e-06,
"loss": 0.3588,
"step": 14525
},
{
"epoch": 0.58,
"learning_rate": 9.71887887887888e-06,
"loss": 0.3334,
"step": 14550
},
{
"epoch": 0.58,
"learning_rate": 9.718378378378379e-06,
"loss": 0.3624,
"step": 14575
},
{
"epoch": 0.58,
"learning_rate": 9.717877877877878e-06,
"loss": 0.3609,
"step": 14600
},
{
"epoch": 0.58,
"learning_rate": 9.717377377377378e-06,
"loss": 0.3339,
"step": 14625
},
{
"epoch": 0.58,
"learning_rate": 9.716876876876877e-06,
"loss": 0.353,
"step": 14650
},
{
"epoch": 0.59,
"learning_rate": 9.716376376376378e-06,
"loss": 0.3517,
"step": 14675
},
{
"epoch": 0.59,
"learning_rate": 9.715875875875877e-06,
"loss": 0.3626,
"step": 14700
},
{
"epoch": 0.59,
"learning_rate": 9.715375375375377e-06,
"loss": 0.3268,
"step": 14725
},
{
"epoch": 0.59,
"learning_rate": 9.714874874874876e-06,
"loss": 0.3648,
"step": 14750
},
{
"epoch": 0.59,
"learning_rate": 9.714374374374375e-06,
"loss": 0.3579,
"step": 14775
},
{
"epoch": 0.59,
"learning_rate": 9.713873873873874e-06,
"loss": 0.3403,
"step": 14800
},
{
"epoch": 0.59,
"learning_rate": 9.713373373373374e-06,
"loss": 0.3597,
"step": 14825
},
{
"epoch": 0.59,
"learning_rate": 9.712872872872873e-06,
"loss": 0.3323,
"step": 14850
},
{
"epoch": 0.59,
"learning_rate": 9.712372372372372e-06,
"loss": 0.3412,
"step": 14875
},
{
"epoch": 0.59,
"learning_rate": 9.711871871871873e-06,
"loss": 0.3574,
"step": 14900
},
{
"epoch": 0.6,
"learning_rate": 9.711371371371373e-06,
"loss": 0.348,
"step": 14925
},
{
"epoch": 0.6,
"learning_rate": 9.710870870870872e-06,
"loss": 0.3588,
"step": 14950
},
{
"epoch": 0.6,
"learning_rate": 9.710370370370371e-06,
"loss": 0.3445,
"step": 14975
},
{
"epoch": 0.6,
"learning_rate": 9.70986986986987e-06,
"loss": 0.3545,
"step": 15000
},
{
"epoch": 0.6,
"eval_loss": 0.5023101568222046,
"eval_runtime": 2571.7112,
"eval_samples_per_second": 6.304,
"eval_steps_per_second": 0.158,
"eval_wer": 30.215616592533205,
"step": 15000
},
{
"epoch": 0.6,
"learning_rate": 9.70936936936937e-06,
"loss": 0.3526,
"step": 15025
},
{
"epoch": 0.6,
"learning_rate": 9.708868868868869e-06,
"loss": 0.361,
"step": 15050
},
{
"epoch": 0.6,
"learning_rate": 9.70836836836837e-06,
"loss": 0.3731,
"step": 15075
},
{
"epoch": 0.6,
"learning_rate": 9.707867867867868e-06,
"loss": 0.3499,
"step": 15100
},
{
"epoch": 0.6,
"learning_rate": 9.707367367367369e-06,
"loss": 0.3608,
"step": 15125
},
{
"epoch": 0.6,
"learning_rate": 9.706866866866868e-06,
"loss": 0.3465,
"step": 15150
},
{
"epoch": 0.61,
"learning_rate": 9.706366366366367e-06,
"loss": 0.362,
"step": 15175
},
{
"epoch": 0.61,
"learning_rate": 9.705865865865867e-06,
"loss": 0.348,
"step": 15200
},
{
"epoch": 0.61,
"learning_rate": 9.705365365365366e-06,
"loss": 0.3532,
"step": 15225
},
{
"epoch": 0.61,
"learning_rate": 9.704864864864865e-06,
"loss": 0.3352,
"step": 15250
},
{
"epoch": 0.61,
"learning_rate": 9.704364364364364e-06,
"loss": 0.3424,
"step": 15275
},
{
"epoch": 0.61,
"learning_rate": 9.703863863863865e-06,
"loss": 0.3569,
"step": 15300
},
{
"epoch": 0.61,
"learning_rate": 9.703363363363365e-06,
"loss": 0.329,
"step": 15325
},
{
"epoch": 0.61,
"learning_rate": 9.702862862862864e-06,
"loss": 0.3551,
"step": 15350
},
{
"epoch": 0.61,
"learning_rate": 9.702362362362363e-06,
"loss": 0.3592,
"step": 15375
},
{
"epoch": 0.61,
"learning_rate": 9.701861861861863e-06,
"loss": 0.359,
"step": 15400
},
{
"epoch": 0.62,
"learning_rate": 9.701361361361362e-06,
"loss": 0.3498,
"step": 15425
},
{
"epoch": 0.62,
"learning_rate": 9.700860860860861e-06,
"loss": 0.352,
"step": 15450
},
{
"epoch": 0.62,
"learning_rate": 9.70036036036036e-06,
"loss": 0.3451,
"step": 15475
},
{
"epoch": 0.62,
"learning_rate": 9.69985985985986e-06,
"loss": 0.3582,
"step": 15500
},
{
"epoch": 0.62,
"learning_rate": 9.69935935935936e-06,
"loss": 0.3495,
"step": 15525
},
{
"epoch": 0.62,
"learning_rate": 9.69885885885886e-06,
"loss": 0.3603,
"step": 15550
},
{
"epoch": 0.62,
"learning_rate": 9.69835835835836e-06,
"loss": 0.3398,
"step": 15575
},
{
"epoch": 0.62,
"learning_rate": 9.697857857857859e-06,
"loss": 0.3532,
"step": 15600
},
{
"epoch": 0.62,
"learning_rate": 9.697357357357358e-06,
"loss": 0.3848,
"step": 15625
},
{
"epoch": 0.62,
"learning_rate": 9.696856856856857e-06,
"loss": 0.3341,
"step": 15650
},
{
"epoch": 0.63,
"learning_rate": 9.696356356356357e-06,
"loss": 0.37,
"step": 15675
},
{
"epoch": 0.63,
"learning_rate": 9.695855855855858e-06,
"loss": 0.3635,
"step": 15700
},
{
"epoch": 0.63,
"learning_rate": 9.695355355355355e-06,
"loss": 0.3614,
"step": 15725
},
{
"epoch": 0.63,
"learning_rate": 9.694854854854856e-06,
"loss": 0.3651,
"step": 15750
},
{
"epoch": 0.63,
"learning_rate": 9.694354354354355e-06,
"loss": 0.3733,
"step": 15775
},
{
"epoch": 0.63,
"learning_rate": 9.693853853853855e-06,
"loss": 0.3455,
"step": 15800
},
{
"epoch": 0.63,
"learning_rate": 9.693353353353354e-06,
"loss": 0.3551,
"step": 15825
},
{
"epoch": 0.63,
"learning_rate": 9.692852852852853e-06,
"loss": 0.3517,
"step": 15850
},
{
"epoch": 0.63,
"learning_rate": 9.692352352352353e-06,
"loss": 0.3595,
"step": 15875
},
{
"epoch": 0.63,
"learning_rate": 9.691851851851852e-06,
"loss": 0.3694,
"step": 15900
},
{
"epoch": 0.64,
"learning_rate": 9.691351351351353e-06,
"loss": 0.3433,
"step": 15925
},
{
"epoch": 0.64,
"learning_rate": 9.69085085085085e-06,
"loss": 0.3443,
"step": 15950
},
{
"epoch": 0.64,
"learning_rate": 9.690350350350352e-06,
"loss": 0.3754,
"step": 15975
},
{
"epoch": 0.64,
"learning_rate": 9.689849849849851e-06,
"loss": 0.369,
"step": 16000
},
{
"epoch": 0.64,
"eval_loss": 0.4858362674713135,
"eval_runtime": 2697.5515,
"eval_samples_per_second": 6.01,
"eval_steps_per_second": 0.151,
"eval_wer": 31.24320657410905,
"step": 16000
},
{
"epoch": 0.64,
"learning_rate": 9.68934934934935e-06,
"loss": 0.3536,
"step": 16025
},
{
"epoch": 0.64,
"learning_rate": 9.68884884884885e-06,
"loss": 0.339,
"step": 16050
},
{
"epoch": 0.64,
"learning_rate": 9.688348348348349e-06,
"loss": 0.3319,
"step": 16075
},
{
"epoch": 0.64,
"learning_rate": 9.687847847847848e-06,
"loss": 0.3742,
"step": 16100
},
{
"epoch": 0.64,
"learning_rate": 9.687347347347347e-06,
"loss": 0.3299,
"step": 16125
},
{
"epoch": 0.64,
"learning_rate": 9.686846846846848e-06,
"loss": 0.3526,
"step": 16150
},
{
"epoch": 0.65,
"learning_rate": 9.686346346346348e-06,
"loss": 0.3479,
"step": 16175
},
{
"epoch": 0.65,
"learning_rate": 9.685845845845847e-06,
"loss": 0.3631,
"step": 16200
},
{
"epoch": 0.65,
"learning_rate": 9.685345345345346e-06,
"loss": 0.3545,
"step": 16225
},
{
"epoch": 0.65,
"learning_rate": 9.684844844844846e-06,
"loss": 0.3651,
"step": 16250
},
{
"epoch": 0.65,
"learning_rate": 9.684344344344345e-06,
"loss": 0.3438,
"step": 16275
},
{
"epoch": 0.65,
"learning_rate": 9.683843843843844e-06,
"loss": 0.3502,
"step": 16300
},
{
"epoch": 0.65,
"learning_rate": 9.683343343343345e-06,
"loss": 0.357,
"step": 16325
},
{
"epoch": 0.65,
"learning_rate": 9.682842842842843e-06,
"loss": 0.349,
"step": 16350
},
{
"epoch": 0.65,
"learning_rate": 9.682342342342344e-06,
"loss": 0.3369,
"step": 16375
},
{
"epoch": 0.65,
"learning_rate": 9.681841841841843e-06,
"loss": 0.361,
"step": 16400
},
{
"epoch": 0.66,
"learning_rate": 9.681341341341342e-06,
"loss": 0.3435,
"step": 16425
},
{
"epoch": 0.66,
"learning_rate": 9.680840840840842e-06,
"loss": 0.3185,
"step": 16450
},
{
"epoch": 0.66,
"learning_rate": 9.680340340340341e-06,
"loss": 0.3341,
"step": 16475
},
{
"epoch": 0.66,
"learning_rate": 9.67983983983984e-06,
"loss": 0.3349,
"step": 16500
},
{
"epoch": 0.66,
"learning_rate": 9.67933933933934e-06,
"loss": 0.3453,
"step": 16525
},
{
"epoch": 0.66,
"learning_rate": 9.67883883883884e-06,
"loss": 0.3519,
"step": 16550
},
{
"epoch": 0.66,
"learning_rate": 9.678338338338338e-06,
"loss": 0.3529,
"step": 16575
},
{
"epoch": 0.66,
"learning_rate": 9.677857857857859e-06,
"loss": 0.3486,
"step": 16600
},
{
"epoch": 0.66,
"learning_rate": 9.677357357357358e-06,
"loss": 0.3424,
"step": 16625
},
{
"epoch": 0.66,
"learning_rate": 9.676856856856858e-06,
"loss": 0.3455,
"step": 16650
},
{
"epoch": 0.66,
"learning_rate": 9.676356356356357e-06,
"loss": 0.3431,
"step": 16675
},
{
"epoch": 0.67,
"learning_rate": 9.675855855855856e-06,
"loss": 0.3379,
"step": 16700
},
{
"epoch": 0.67,
"learning_rate": 9.675355355355355e-06,
"loss": 0.3539,
"step": 16725
},
{
"epoch": 0.67,
"learning_rate": 9.674854854854856e-06,
"loss": 0.327,
"step": 16750
},
{
"epoch": 0.67,
"learning_rate": 9.674354354354356e-06,
"loss": 0.3275,
"step": 16775
},
{
"epoch": 0.67,
"learning_rate": 9.673853853853855e-06,
"loss": 0.3396,
"step": 16800
},
{
"epoch": 0.67,
"learning_rate": 9.673353353353354e-06,
"loss": 0.3476,
"step": 16825
},
{
"epoch": 0.67,
"learning_rate": 9.672852852852854e-06,
"loss": 0.3675,
"step": 16850
},
{
"epoch": 0.67,
"learning_rate": 9.672352352352353e-06,
"loss": 0.3571,
"step": 16875
},
{
"epoch": 0.67,
"learning_rate": 9.671851851851852e-06,
"loss": 0.3463,
"step": 16900
},
{
"epoch": 0.67,
"learning_rate": 9.671351351351353e-06,
"loss": 0.3381,
"step": 16925
},
{
"epoch": 0.68,
"learning_rate": 9.67085085085085e-06,
"loss": 0.3582,
"step": 16950
},
{
"epoch": 0.68,
"learning_rate": 9.670350350350352e-06,
"loss": 0.3633,
"step": 16975
},
{
"epoch": 0.68,
"learning_rate": 9.669849849849851e-06,
"loss": 0.3585,
"step": 17000
},
{
"epoch": 0.68,
"eval_loss": 0.4826071560382843,
"eval_runtime": 2556.6287,
"eval_samples_per_second": 6.342,
"eval_steps_per_second": 0.159,
"eval_wer": 29.16952536597775,
"step": 17000
},
{
"epoch": 0.68,
"learning_rate": 9.66934934934935e-06,
"loss": 0.3504,
"step": 17025
},
{
"epoch": 0.68,
"learning_rate": 9.66884884884885e-06,
"loss": 0.3523,
"step": 17050
},
{
"epoch": 0.68,
"learning_rate": 9.668348348348349e-06,
"loss": 0.3572,
"step": 17075
},
{
"epoch": 0.68,
"learning_rate": 9.667847847847848e-06,
"loss": 0.364,
"step": 17100
},
{
"epoch": 0.68,
"learning_rate": 9.667347347347348e-06,
"loss": 0.3251,
"step": 17125
},
{
"epoch": 0.68,
"learning_rate": 9.666846846846849e-06,
"loss": 0.3318,
"step": 17150
},
{
"epoch": 0.68,
"learning_rate": 9.666346346346346e-06,
"loss": 0.3456,
"step": 17175
},
{
"epoch": 0.69,
"learning_rate": 9.665845845845847e-06,
"loss": 0.345,
"step": 17200
},
{
"epoch": 0.69,
"learning_rate": 9.665345345345346e-06,
"loss": 0.3224,
"step": 17225
},
{
"epoch": 0.69,
"learning_rate": 9.664844844844846e-06,
"loss": 0.3397,
"step": 17250
},
{
"epoch": 0.69,
"learning_rate": 9.664344344344345e-06,
"loss": 0.3484,
"step": 17275
},
{
"epoch": 0.69,
"learning_rate": 9.663843843843844e-06,
"loss": 0.3267,
"step": 17300
},
{
"epoch": 0.69,
"learning_rate": 9.663343343343344e-06,
"loss": 0.3642,
"step": 17325
},
{
"epoch": 0.69,
"learning_rate": 9.662842842842843e-06,
"loss": 0.3447,
"step": 17350
},
{
"epoch": 0.69,
"learning_rate": 9.662342342342344e-06,
"loss": 0.3429,
"step": 17375
},
{
"epoch": 0.69,
"learning_rate": 9.661841841841843e-06,
"loss": 0.3258,
"step": 17400
},
{
"epoch": 0.69,
"learning_rate": 9.661341341341343e-06,
"loss": 0.3305,
"step": 17425
},
{
"epoch": 0.7,
"learning_rate": 9.660840840840842e-06,
"loss": 0.3376,
"step": 17450
},
{
"epoch": 0.7,
"learning_rate": 9.660340340340341e-06,
"loss": 0.3417,
"step": 17475
},
{
"epoch": 0.7,
"learning_rate": 9.65983983983984e-06,
"loss": 0.3326,
"step": 17500
},
{
"epoch": 0.7,
"learning_rate": 9.65933933933934e-06,
"loss": 0.334,
"step": 17525
},
{
"epoch": 0.7,
"learning_rate": 9.65883883883884e-06,
"loss": 0.3461,
"step": 17550
},
{
"epoch": 0.7,
"learning_rate": 9.658338338338338e-06,
"loss": 0.3512,
"step": 17575
},
{
"epoch": 0.7,
"learning_rate": 9.65783783783784e-06,
"loss": 0.3609,
"step": 17600
},
{
"epoch": 0.7,
"learning_rate": 9.657337337337339e-06,
"loss": 0.3502,
"step": 17625
},
{
"epoch": 0.7,
"learning_rate": 9.656836836836838e-06,
"loss": 0.3508,
"step": 17650
},
{
"epoch": 0.7,
"learning_rate": 9.656336336336337e-06,
"loss": 0.3436,
"step": 17675
},
{
"epoch": 0.71,
"learning_rate": 9.655835835835836e-06,
"loss": 0.3525,
"step": 17700
},
{
"epoch": 0.71,
"learning_rate": 9.655335335335336e-06,
"loss": 0.339,
"step": 17725
},
{
"epoch": 0.71,
"learning_rate": 9.654834834834835e-06,
"loss": 0.3507,
"step": 17750
},
{
"epoch": 0.71,
"learning_rate": 9.654334334334336e-06,
"loss": 0.3277,
"step": 17775
},
{
"epoch": 0.71,
"learning_rate": 9.653833833833834e-06,
"loss": 0.3486,
"step": 17800
},
{
"epoch": 0.71,
"learning_rate": 9.653353353353354e-06,
"loss": 0.3529,
"step": 17825
},
{
"epoch": 0.71,
"learning_rate": 9.652852852852854e-06,
"loss": 0.3228,
"step": 17850
},
{
"epoch": 0.71,
"learning_rate": 9.652352352352353e-06,
"loss": 0.335,
"step": 17875
},
{
"epoch": 0.71,
"learning_rate": 9.651851851851852e-06,
"loss": 0.3641,
"step": 17900
},
{
"epoch": 0.71,
"learning_rate": 9.651351351351352e-06,
"loss": 0.3248,
"step": 17925
},
{
"epoch": 0.72,
"learning_rate": 9.650850850850851e-06,
"loss": 0.3308,
"step": 17950
},
{
"epoch": 0.72,
"learning_rate": 9.650350350350352e-06,
"loss": 0.333,
"step": 17975
},
{
"epoch": 0.72,
"learning_rate": 9.649849849849851e-06,
"loss": 0.3302,
"step": 18000
},
{
"epoch": 0.72,
"eval_loss": 0.4842660427093506,
"eval_runtime": 2644.843,
"eval_samples_per_second": 6.13,
"eval_steps_per_second": 0.154,
"eval_wer": 29.56498947741692,
"step": 18000
},
{
"epoch": 0.72,
"learning_rate": 9.64934934934935e-06,
"loss": 0.3624,
"step": 18025
},
{
"epoch": 0.72,
"learning_rate": 9.64884884884885e-06,
"loss": 0.3645,
"step": 18050
},
{
"epoch": 0.72,
"learning_rate": 9.648348348348349e-06,
"loss": 0.3563,
"step": 18075
},
{
"epoch": 0.72,
"learning_rate": 9.647847847847848e-06,
"loss": 0.3354,
"step": 18100
},
{
"epoch": 0.72,
"learning_rate": 9.647347347347348e-06,
"loss": 0.3352,
"step": 18125
},
{
"epoch": 0.72,
"learning_rate": 9.646846846846849e-06,
"loss": 0.3426,
"step": 18150
},
{
"epoch": 0.72,
"learning_rate": 9.646346346346346e-06,
"loss": 0.3534,
"step": 18175
},
{
"epoch": 0.73,
"learning_rate": 9.645845845845847e-06,
"loss": 0.3316,
"step": 18200
},
{
"epoch": 0.73,
"learning_rate": 9.645345345345347e-06,
"loss": 0.3387,
"step": 18225
},
{
"epoch": 0.73,
"learning_rate": 9.644844844844846e-06,
"loss": 0.3489,
"step": 18250
},
{
"epoch": 0.73,
"learning_rate": 9.644344344344345e-06,
"loss": 0.3339,
"step": 18275
},
{
"epoch": 0.73,
"learning_rate": 9.643843843843845e-06,
"loss": 0.3416,
"step": 18300
},
{
"epoch": 0.73,
"learning_rate": 9.643343343343344e-06,
"loss": 0.3259,
"step": 18325
},
{
"epoch": 0.73,
"learning_rate": 9.642842842842843e-06,
"loss": 0.3476,
"step": 18350
},
{
"epoch": 0.73,
"learning_rate": 9.642342342342344e-06,
"loss": 0.3499,
"step": 18375
},
{
"epoch": 0.73,
"learning_rate": 9.641841841841842e-06,
"loss": 0.3438,
"step": 18400
},
{
"epoch": 0.73,
"learning_rate": 9.641341341341343e-06,
"loss": 0.3316,
"step": 18425
},
{
"epoch": 0.74,
"learning_rate": 9.640840840840842e-06,
"loss": 0.3397,
"step": 18450
},
{
"epoch": 0.74,
"learning_rate": 9.640340340340341e-06,
"loss": 0.3281,
"step": 18475
},
{
"epoch": 0.74,
"learning_rate": 9.63983983983984e-06,
"loss": 0.3316,
"step": 18500
},
{
"epoch": 0.74,
"learning_rate": 9.63933933933934e-06,
"loss": 0.3487,
"step": 18525
},
{
"epoch": 0.74,
"learning_rate": 9.63883883883884e-06,
"loss": 0.3273,
"step": 18550
},
{
"epoch": 0.74,
"learning_rate": 9.638338338338338e-06,
"loss": 0.3522,
"step": 18575
},
{
"epoch": 0.74,
"learning_rate": 9.63783783783784e-06,
"loss": 0.3261,
"step": 18600
},
{
"epoch": 0.74,
"learning_rate": 9.637337337337339e-06,
"loss": 0.3551,
"step": 18625
},
{
"epoch": 0.74,
"learning_rate": 9.636836836836838e-06,
"loss": 0.343,
"step": 18650
},
{
"epoch": 0.74,
"learning_rate": 9.636336336336337e-06,
"loss": 0.3302,
"step": 18675
},
{
"epoch": 0.75,
"learning_rate": 9.635835835835837e-06,
"loss": 0.3287,
"step": 18700
},
{
"epoch": 0.75,
"learning_rate": 9.635335335335336e-06,
"loss": 0.3317,
"step": 18725
},
{
"epoch": 0.75,
"learning_rate": 9.634834834834835e-06,
"loss": 0.3346,
"step": 18750
},
{
"epoch": 0.75,
"learning_rate": 9.634334334334336e-06,
"loss": 0.3531,
"step": 18775
},
{
"epoch": 0.75,
"learning_rate": 9.633833833833834e-06,
"loss": 0.35,
"step": 18800
},
{
"epoch": 0.75,
"learning_rate": 9.633333333333335e-06,
"loss": 0.3407,
"step": 18825
},
{
"epoch": 0.75,
"learning_rate": 9.632832832832834e-06,
"loss": 0.3193,
"step": 18850
},
{
"epoch": 0.75,
"learning_rate": 9.632332332332333e-06,
"loss": 0.351,
"step": 18875
},
{
"epoch": 0.75,
"learning_rate": 9.631831831831833e-06,
"loss": 0.3554,
"step": 18900
},
{
"epoch": 0.75,
"learning_rate": 9.631331331331332e-06,
"loss": 0.3389,
"step": 18925
},
{
"epoch": 0.76,
"learning_rate": 9.630830830830831e-06,
"loss": 0.3196,
"step": 18950
},
{
"epoch": 0.76,
"learning_rate": 9.63033033033033e-06,
"loss": 0.3271,
"step": 18975
},
{
"epoch": 0.76,
"learning_rate": 9.629829829829832e-06,
"loss": 0.3252,
"step": 19000
},
{
"epoch": 0.76,
"eval_loss": 0.4709344506263733,
"eval_runtime": 2536.9152,
"eval_samples_per_second": 6.391,
"eval_steps_per_second": 0.16,
"eval_wer": 28.698514504205182,
"step": 19000
},
{
"epoch": 0.76,
"learning_rate": 9.62932932932933e-06,
"loss": 0.3142,
"step": 19025
},
{
"epoch": 0.76,
"learning_rate": 9.62882882882883e-06,
"loss": 0.3346,
"step": 19050
},
{
"epoch": 0.76,
"learning_rate": 9.62832832832833e-06,
"loss": 0.3582,
"step": 19075
},
{
"epoch": 0.76,
"learning_rate": 9.627827827827829e-06,
"loss": 0.327,
"step": 19100
},
{
"epoch": 0.76,
"learning_rate": 9.627327327327328e-06,
"loss": 0.3347,
"step": 19125
},
{
"epoch": 0.76,
"learning_rate": 9.626826826826827e-06,
"loss": 0.3509,
"step": 19150
},
{
"epoch": 0.76,
"learning_rate": 9.626326326326327e-06,
"loss": 0.3349,
"step": 19175
},
{
"epoch": 0.77,
"learning_rate": 9.625825825825826e-06,
"loss": 0.335,
"step": 19200
},
{
"epoch": 0.77,
"learning_rate": 9.625325325325327e-06,
"loss": 0.3371,
"step": 19225
},
{
"epoch": 0.77,
"learning_rate": 9.624824824824826e-06,
"loss": 0.3475,
"step": 19250
},
{
"epoch": 0.77,
"learning_rate": 9.624324324324326e-06,
"loss": 0.3428,
"step": 19275
},
{
"epoch": 0.77,
"learning_rate": 9.623823823823825e-06,
"loss": 0.3375,
"step": 19300
},
{
"epoch": 0.77,
"learning_rate": 9.623323323323324e-06,
"loss": 0.335,
"step": 19325
},
{
"epoch": 0.77,
"learning_rate": 9.622822822822823e-06,
"loss": 0.3488,
"step": 19350
},
{
"epoch": 0.77,
"learning_rate": 9.622322322322323e-06,
"loss": 0.3255,
"step": 19375
},
{
"epoch": 0.77,
"learning_rate": 9.621821821821822e-06,
"loss": 0.3419,
"step": 19400
},
{
"epoch": 0.77,
"learning_rate": 9.621321321321321e-06,
"loss": 0.3257,
"step": 19425
},
{
"epoch": 0.78,
"learning_rate": 9.620820820820822e-06,
"loss": 0.337,
"step": 19450
},
{
"epoch": 0.78,
"learning_rate": 9.620320320320322e-06,
"loss": 0.3159,
"step": 19475
},
{
"epoch": 0.78,
"learning_rate": 9.619819819819821e-06,
"loss": 0.336,
"step": 19500
},
{
"epoch": 0.78,
"learning_rate": 9.61931931931932e-06,
"loss": 0.3218,
"step": 19525
},
{
"epoch": 0.78,
"learning_rate": 9.61881881881882e-06,
"loss": 0.3447,
"step": 19550
},
{
"epoch": 0.78,
"learning_rate": 9.618318318318319e-06,
"loss": 0.3395,
"step": 19575
},
{
"epoch": 0.78,
"learning_rate": 9.617817817817818e-06,
"loss": 0.3237,
"step": 19600
},
{
"epoch": 0.78,
"learning_rate": 9.617317317317319e-06,
"loss": 0.331,
"step": 19625
},
{
"epoch": 0.78,
"learning_rate": 9.616816816816817e-06,
"loss": 0.3152,
"step": 19650
},
{
"epoch": 0.78,
"learning_rate": 9.616316316316318e-06,
"loss": 0.3391,
"step": 19675
},
{
"epoch": 0.79,
"learning_rate": 9.615815815815817e-06,
"loss": 0.3293,
"step": 19700
},
{
"epoch": 0.79,
"learning_rate": 9.615315315315316e-06,
"loss": 0.3322,
"step": 19725
},
{
"epoch": 0.79,
"learning_rate": 9.614814814814816e-06,
"loss": 0.3294,
"step": 19750
},
{
"epoch": 0.79,
"learning_rate": 9.614314314314315e-06,
"loss": 0.334,
"step": 19775
},
{
"epoch": 0.79,
"learning_rate": 9.613813813813814e-06,
"loss": 0.3418,
"step": 19800
},
{
"epoch": 0.79,
"learning_rate": 9.613313313313314e-06,
"loss": 0.3456,
"step": 19825
},
{
"epoch": 0.79,
"learning_rate": 9.612812812812815e-06,
"loss": 0.3513,
"step": 19850
},
{
"epoch": 0.79,
"learning_rate": 9.612312312312314e-06,
"loss": 0.3395,
"step": 19875
},
{
"epoch": 0.79,
"learning_rate": 9.611811811811813e-06,
"loss": 0.3478,
"step": 19900
},
{
"epoch": 0.79,
"learning_rate": 9.611311311311312e-06,
"loss": 0.3278,
"step": 19925
},
{
"epoch": 0.8,
"learning_rate": 9.610810810810812e-06,
"loss": 0.3012,
"step": 19950
},
{
"epoch": 0.8,
"learning_rate": 9.610310310310311e-06,
"loss": 0.3453,
"step": 19975
},
{
"epoch": 0.8,
"learning_rate": 9.60980980980981e-06,
"loss": 0.3453,
"step": 20000
},
{
"epoch": 0.8,
"eval_loss": 0.471629798412323,
"eval_runtime": 2478.9552,
"eval_samples_per_second": 6.54,
"eval_steps_per_second": 0.164,
"eval_wer": 27.84051926827576,
"step": 20000
},
{
"epoch": 0.8,
"learning_rate": 9.60930930930931e-06,
"loss": 0.3442,
"step": 20025
},
{
"epoch": 0.8,
"learning_rate": 9.608808808808809e-06,
"loss": 0.3431,
"step": 20050
},
{
"epoch": 0.8,
"learning_rate": 9.60830830830831e-06,
"loss": 0.3146,
"step": 20075
},
{
"epoch": 0.8,
"learning_rate": 9.60780780780781e-06,
"loss": 0.3474,
"step": 20100
},
{
"epoch": 0.8,
"learning_rate": 9.607307307307307e-06,
"loss": 0.3335,
"step": 20125
},
{
"epoch": 0.8,
"learning_rate": 9.606806806806808e-06,
"loss": 0.3374,
"step": 20150
},
{
"epoch": 0.8,
"learning_rate": 9.606306306306307e-06,
"loss": 0.3235,
"step": 20175
},
{
"epoch": 0.81,
"learning_rate": 9.605805805805806e-06,
"loss": 0.339,
"step": 20200
},
{
"epoch": 0.81,
"learning_rate": 9.605305305305306e-06,
"loss": 0.3468,
"step": 20225
},
{
"epoch": 0.81,
"learning_rate": 9.604804804804807e-06,
"loss": 0.3587,
"step": 20250
},
{
"epoch": 0.81,
"learning_rate": 9.604304304304304e-06,
"loss": 0.3113,
"step": 20275
},
{
"epoch": 0.81,
"learning_rate": 9.603803803803805e-06,
"loss": 0.3224,
"step": 20300
},
{
"epoch": 0.81,
"learning_rate": 9.603303303303305e-06,
"loss": 0.3298,
"step": 20325
},
{
"epoch": 0.81,
"learning_rate": 9.602802802802804e-06,
"loss": 0.3489,
"step": 20350
},
{
"epoch": 0.81,
"learning_rate": 9.602302302302303e-06,
"loss": 0.2943,
"step": 20375
},
{
"epoch": 0.81,
"learning_rate": 9.601801801801802e-06,
"loss": 0.3283,
"step": 20400
},
{
"epoch": 0.81,
"learning_rate": 9.601301301301302e-06,
"loss": 0.3167,
"step": 20425
},
{
"epoch": 0.82,
"learning_rate": 9.600800800800801e-06,
"loss": 0.3427,
"step": 20450
},
{
"epoch": 0.82,
"learning_rate": 9.600300300300302e-06,
"loss": 0.3538,
"step": 20475
},
{
"epoch": 0.82,
"learning_rate": 9.599799799799801e-06,
"loss": 0.3353,
"step": 20500
},
{
"epoch": 0.82,
"learning_rate": 9.5992992992993e-06,
"loss": 0.3427,
"step": 20525
},
{
"epoch": 0.82,
"learning_rate": 9.5987987987988e-06,
"loss": 0.3349,
"step": 20550
},
{
"epoch": 0.82,
"learning_rate": 9.5982982982983e-06,
"loss": 0.334,
"step": 20575
},
{
"epoch": 0.82,
"learning_rate": 9.597797797797799e-06,
"loss": 0.3281,
"step": 20600
},
{
"epoch": 0.82,
"learning_rate": 9.597297297297298e-06,
"loss": 0.3231,
"step": 20625
},
{
"epoch": 0.82,
"learning_rate": 9.596796796796797e-06,
"loss": 0.336,
"step": 20650
},
{
"epoch": 0.82,
"learning_rate": 9.596296296296296e-06,
"loss": 0.3208,
"step": 20675
},
{
"epoch": 0.83,
"learning_rate": 9.595795795795797e-06,
"loss": 0.3261,
"step": 20700
},
{
"epoch": 0.83,
"learning_rate": 9.595295295295297e-06,
"loss": 0.3354,
"step": 20725
},
{
"epoch": 0.83,
"learning_rate": 9.594794794794794e-06,
"loss": 0.3311,
"step": 20750
},
{
"epoch": 0.83,
"learning_rate": 9.594294294294295e-06,
"loss": 0.3372,
"step": 20775
},
{
"epoch": 0.83,
"learning_rate": 9.593793793793795e-06,
"loss": 0.3263,
"step": 20800
},
{
"epoch": 0.83,
"learning_rate": 9.593293293293294e-06,
"loss": 0.3187,
"step": 20825
},
{
"epoch": 0.83,
"learning_rate": 9.592792792792793e-06,
"loss": 0.317,
"step": 20850
},
{
"epoch": 0.83,
"learning_rate": 9.592292292292294e-06,
"loss": 0.3428,
"step": 20875
},
{
"epoch": 0.83,
"learning_rate": 9.591791791791792e-06,
"loss": 0.3049,
"step": 20900
},
{
"epoch": 0.83,
"learning_rate": 9.591291291291293e-06,
"loss": 0.3125,
"step": 20925
},
{
"epoch": 0.84,
"learning_rate": 9.590790790790792e-06,
"loss": 0.3206,
"step": 20950
},
{
"epoch": 0.84,
"learning_rate": 9.590290290290291e-06,
"loss": 0.3515,
"step": 20975
},
{
"epoch": 0.84,
"learning_rate": 9.58978978978979e-06,
"loss": 0.3412,
"step": 21000
},
{
"epoch": 0.84,
"eval_loss": 0.4714227020740509,
"eval_runtime": 2637.8451,
"eval_samples_per_second": 6.146,
"eval_steps_per_second": 0.154,
"eval_wer": 29.17954687367504,
"step": 21000
},
{
"epoch": 0.84,
"learning_rate": 9.58928928928929e-06,
"loss": 0.3176,
"step": 21025
},
{
"epoch": 0.84,
"learning_rate": 9.58878878878879e-06,
"loss": 0.3355,
"step": 21050
},
{
"epoch": 0.84,
"learning_rate": 9.588288288288289e-06,
"loss": 0.3306,
"step": 21075
},
{
"epoch": 0.84,
"learning_rate": 9.58778778778779e-06,
"loss": 0.3532,
"step": 21100
},
{
"epoch": 0.84,
"learning_rate": 9.587287287287287e-06,
"loss": 0.3311,
"step": 21125
},
{
"epoch": 0.84,
"learning_rate": 9.586786786786788e-06,
"loss": 0.3377,
"step": 21150
},
{
"epoch": 0.84,
"learning_rate": 9.586286286286287e-06,
"loss": 0.3171,
"step": 21175
},
{
"epoch": 0.85,
"learning_rate": 9.585785785785787e-06,
"loss": 0.3454,
"step": 21200
},
{
"epoch": 0.85,
"learning_rate": 9.585285285285286e-06,
"loss": 0.311,
"step": 21225
},
{
"epoch": 0.85,
"learning_rate": 9.584784784784785e-06,
"loss": 0.3303,
"step": 21250
},
{
"epoch": 0.85,
"learning_rate": 9.584284284284285e-06,
"loss": 0.3204,
"step": 21275
},
{
"epoch": 0.85,
"learning_rate": 9.583783783783784e-06,
"loss": 0.3104,
"step": 21300
},
{
"epoch": 0.85,
"learning_rate": 9.583283283283285e-06,
"loss": 0.3244,
"step": 21325
},
{
"epoch": 0.85,
"learning_rate": 9.582782782782784e-06,
"loss": 0.3192,
"step": 21350
},
{
"epoch": 0.85,
"learning_rate": 9.582282282282282e-06,
"loss": 0.3238,
"step": 21375
},
{
"epoch": 0.85,
"learning_rate": 9.581781781781783e-06,
"loss": 0.3298,
"step": 21400
},
{
"epoch": 0.85,
"learning_rate": 9.581281281281282e-06,
"loss": 0.3223,
"step": 21425
},
{
"epoch": 0.86,
"learning_rate": 9.580780780780781e-06,
"loss": 0.3576,
"step": 21450
},
{
"epoch": 0.86,
"learning_rate": 9.58028028028028e-06,
"loss": 0.305,
"step": 21475
},
{
"epoch": 0.86,
"learning_rate": 9.579779779779782e-06,
"loss": 0.3287,
"step": 21500
},
{
"epoch": 0.86,
"learning_rate": 9.57927927927928e-06,
"loss": 0.3372,
"step": 21525
},
{
"epoch": 0.86,
"learning_rate": 9.57877877877878e-06,
"loss": 0.3142,
"step": 21550
},
{
"epoch": 0.86,
"learning_rate": 9.57827827827828e-06,
"loss": 0.3222,
"step": 21575
},
{
"epoch": 0.86,
"learning_rate": 9.577777777777779e-06,
"loss": 0.3413,
"step": 21600
},
{
"epoch": 0.86,
"learning_rate": 9.577277277277278e-06,
"loss": 0.3194,
"step": 21625
},
{
"epoch": 0.86,
"learning_rate": 9.576776776776777e-06,
"loss": 0.3226,
"step": 21650
},
{
"epoch": 0.86,
"learning_rate": 9.576276276276277e-06,
"loss": 0.3162,
"step": 21675
},
{
"epoch": 0.87,
"learning_rate": 9.575775775775776e-06,
"loss": 0.3097,
"step": 21700
},
{
"epoch": 0.87,
"learning_rate": 9.575275275275277e-06,
"loss": 0.3366,
"step": 21725
},
{
"epoch": 0.87,
"learning_rate": 9.574774774774775e-06,
"loss": 0.322,
"step": 21750
},
{
"epoch": 0.87,
"learning_rate": 9.574274274274276e-06,
"loss": 0.3407,
"step": 21775
},
{
"epoch": 0.87,
"learning_rate": 9.573773773773775e-06,
"loss": 0.325,
"step": 21800
},
{
"epoch": 0.87,
"learning_rate": 9.573273273273274e-06,
"loss": 0.319,
"step": 21825
},
{
"epoch": 0.87,
"learning_rate": 9.572772772772774e-06,
"loss": 0.318,
"step": 21850
},
{
"epoch": 0.87,
"learning_rate": 9.572272272272273e-06,
"loss": 0.3029,
"step": 21875
},
{
"epoch": 0.87,
"learning_rate": 9.571771771771772e-06,
"loss": 0.3398,
"step": 21900
},
{
"epoch": 0.87,
"learning_rate": 9.571271271271271e-06,
"loss": 0.345,
"step": 21925
},
{
"epoch": 0.88,
"learning_rate": 9.570770770770772e-06,
"loss": 0.3366,
"step": 21950
},
{
"epoch": 0.88,
"learning_rate": 9.570270270270272e-06,
"loss": 0.3192,
"step": 21975
},
{
"epoch": 0.88,
"learning_rate": 9.56976976976977e-06,
"loss": 0.3221,
"step": 22000
},
{
"epoch": 0.88,
"eval_loss": 0.4648185670375824,
"eval_runtime": 2509.1979,
"eval_samples_per_second": 6.461,
"eval_steps_per_second": 0.162,
"eval_wer": 27.938421689626196,
"step": 22000
},
{
"epoch": 0.88,
"learning_rate": 9.56926926926927e-06,
"loss": 0.3333,
"step": 22025
},
{
"epoch": 0.88,
"learning_rate": 9.56876876876877e-06,
"loss": 0.3309,
"step": 22050
},
{
"epoch": 0.88,
"learning_rate": 9.568268268268269e-06,
"loss": 0.3252,
"step": 22075
},
{
"epoch": 0.88,
"learning_rate": 9.567767767767768e-06,
"loss": 0.339,
"step": 22100
},
{
"epoch": 0.88,
"learning_rate": 9.56726726726727e-06,
"loss": 0.3185,
"step": 22125
},
{
"epoch": 0.88,
"learning_rate": 9.566766766766767e-06,
"loss": 0.3312,
"step": 22150
},
{
"epoch": 0.88,
"learning_rate": 9.566266266266268e-06,
"loss": 0.3279,
"step": 22175
},
{
"epoch": 0.89,
"learning_rate": 9.565765765765767e-06,
"loss": 0.3111,
"step": 22200
},
{
"epoch": 0.89,
"learning_rate": 9.565265265265266e-06,
"loss": 0.3294,
"step": 22225
},
{
"epoch": 0.89,
"learning_rate": 9.564764764764766e-06,
"loss": 0.3359,
"step": 22250
},
{
"epoch": 0.89,
"learning_rate": 9.564264264264265e-06,
"loss": 0.3324,
"step": 22275
},
{
"epoch": 0.89,
"learning_rate": 9.563763763763764e-06,
"loss": 0.3331,
"step": 22300
},
{
"epoch": 0.89,
"learning_rate": 9.563263263263264e-06,
"loss": 0.3331,
"step": 22325
},
{
"epoch": 0.89,
"learning_rate": 9.562762762762765e-06,
"loss": 0.307,
"step": 22350
},
{
"epoch": 0.89,
"learning_rate": 9.562262262262262e-06,
"loss": 0.3384,
"step": 22375
},
{
"epoch": 0.89,
"learning_rate": 9.561761761761763e-06,
"loss": 0.3291,
"step": 22400
},
{
"epoch": 0.89,
"learning_rate": 9.561261261261262e-06,
"loss": 0.3411,
"step": 22425
},
{
"epoch": 0.9,
"learning_rate": 9.560760760760762e-06,
"loss": 0.3141,
"step": 22450
},
{
"epoch": 0.9,
"learning_rate": 9.560260260260261e-06,
"loss": 0.3289,
"step": 22475
},
{
"epoch": 0.9,
"learning_rate": 9.55975975975976e-06,
"loss": 0.3289,
"step": 22500
},
{
"epoch": 0.9,
"learning_rate": 9.55925925925926e-06,
"loss": 0.2942,
"step": 22525
},
{
"epoch": 0.9,
"learning_rate": 9.558758758758759e-06,
"loss": 0.3307,
"step": 22550
},
{
"epoch": 0.9,
"learning_rate": 9.55825825825826e-06,
"loss": 0.3565,
"step": 22575
},
{
"epoch": 0.9,
"learning_rate": 9.55775775775776e-06,
"loss": 0.3065,
"step": 22600
},
{
"epoch": 0.9,
"learning_rate": 9.557257257257257e-06,
"loss": 0.3128,
"step": 22625
},
{
"epoch": 0.9,
"learning_rate": 9.556756756756758e-06,
"loss": 0.3181,
"step": 22650
},
{
"epoch": 0.9,
"learning_rate": 9.556256256256257e-06,
"loss": 0.321,
"step": 22675
},
{
"epoch": 0.91,
"learning_rate": 9.555755755755756e-06,
"loss": 0.3305,
"step": 22700
},
{
"epoch": 0.91,
"learning_rate": 9.555255255255256e-06,
"loss": 0.3454,
"step": 22725
},
{
"epoch": 0.91,
"learning_rate": 9.554754754754757e-06,
"loss": 0.3236,
"step": 22750
},
{
"epoch": 0.91,
"learning_rate": 9.554254254254254e-06,
"loss": 0.3345,
"step": 22775
},
{
"epoch": 0.91,
"learning_rate": 9.553753753753755e-06,
"loss": 0.3221,
"step": 22800
},
{
"epoch": 0.91,
"learning_rate": 9.553253253253255e-06,
"loss": 0.3333,
"step": 22825
},
{
"epoch": 0.91,
"learning_rate": 9.552752752752752e-06,
"loss": 0.3176,
"step": 22850
},
{
"epoch": 0.91,
"learning_rate": 9.552252252252253e-06,
"loss": 0.3286,
"step": 22875
},
{
"epoch": 0.91,
"learning_rate": 9.551751751751753e-06,
"loss": 0.3165,
"step": 22900
},
{
"epoch": 0.91,
"learning_rate": 9.551251251251252e-06,
"loss": 0.3312,
"step": 22925
},
{
"epoch": 0.92,
"learning_rate": 9.550750750750751e-06,
"loss": 0.3334,
"step": 22950
},
{
"epoch": 0.92,
"learning_rate": 9.550250250250252e-06,
"loss": 0.3092,
"step": 22975
},
{
"epoch": 0.92,
"learning_rate": 9.54974974974975e-06,
"loss": 0.322,
"step": 23000
},
{
"epoch": 0.92,
"eval_loss": 0.46254613995552063,
"eval_runtime": 2464.8795,
"eval_samples_per_second": 6.578,
"eval_steps_per_second": 0.165,
"eval_wer": 27.390322307105247,
"step": 23000
},
{
"epoch": 0.92,
"learning_rate": 9.54924924924925e-06,
"loss": 0.3245,
"step": 23025
},
{
"epoch": 0.92,
"learning_rate": 9.54874874874875e-06,
"loss": 0.3263,
"step": 23050
},
{
"epoch": 0.92,
"learning_rate": 9.54824824824825e-06,
"loss": 0.3246,
"step": 23075
},
{
"epoch": 0.92,
"learning_rate": 9.547747747747749e-06,
"loss": 0.3407,
"step": 23100
},
{
"epoch": 0.92,
"learning_rate": 9.547247247247248e-06,
"loss": 0.3116,
"step": 23125
},
{
"epoch": 0.92,
"learning_rate": 9.546746746746747e-06,
"loss": 0.3278,
"step": 23150
},
{
"epoch": 0.92,
"learning_rate": 9.546246246246246e-06,
"loss": 0.3369,
"step": 23175
},
{
"epoch": 0.93,
"learning_rate": 9.545745745745747e-06,
"loss": 0.3133,
"step": 23200
},
{
"epoch": 0.93,
"learning_rate": 9.545245245245247e-06,
"loss": 0.3112,
"step": 23225
},
{
"epoch": 0.93,
"learning_rate": 9.544744744744744e-06,
"loss": 0.3316,
"step": 23250
},
{
"epoch": 0.93,
"learning_rate": 9.544244244244245e-06,
"loss": 0.3266,
"step": 23275
},
{
"epoch": 0.93,
"learning_rate": 9.543743743743745e-06,
"loss": 0.3237,
"step": 23300
},
{
"epoch": 0.93,
"learning_rate": 9.543243243243244e-06,
"loss": 0.3073,
"step": 23325
},
{
"epoch": 0.93,
"learning_rate": 9.542742742742743e-06,
"loss": 0.3326,
"step": 23350
},
{
"epoch": 0.93,
"learning_rate": 9.542242242242243e-06,
"loss": 0.3063,
"step": 23375
},
{
"epoch": 0.93,
"learning_rate": 9.541741741741742e-06,
"loss": 0.3145,
"step": 23400
},
{
"epoch": 0.93,
"learning_rate": 9.541241241241243e-06,
"loss": 0.3329,
"step": 23425
},
{
"epoch": 0.94,
"learning_rate": 9.540740740740742e-06,
"loss": 0.3285,
"step": 23450
},
{
"epoch": 0.94,
"learning_rate": 9.54024024024024e-06,
"loss": 0.3312,
"step": 23475
},
{
"epoch": 0.94,
"learning_rate": 9.53973973973974e-06,
"loss": 0.3203,
"step": 23500
},
{
"epoch": 0.94,
"learning_rate": 9.53923923923924e-06,
"loss": 0.327,
"step": 23525
},
{
"epoch": 0.94,
"learning_rate": 9.53873873873874e-06,
"loss": 0.3136,
"step": 23550
},
{
"epoch": 0.94,
"learning_rate": 9.538238238238239e-06,
"loss": 0.314,
"step": 23575
},
{
"epoch": 0.94,
"learning_rate": 9.53773773773774e-06,
"loss": 0.3294,
"step": 23600
},
{
"epoch": 0.94,
"learning_rate": 9.537237237237237e-06,
"loss": 0.3331,
"step": 23625
},
{
"epoch": 0.94,
"learning_rate": 9.536736736736738e-06,
"loss": 0.3112,
"step": 23650
},
{
"epoch": 0.94,
"learning_rate": 9.536236236236237e-06,
"loss": 0.3047,
"step": 23675
},
{
"epoch": 0.95,
"learning_rate": 9.535735735735737e-06,
"loss": 0.3153,
"step": 23700
},
{
"epoch": 0.95,
"learning_rate": 9.535235235235236e-06,
"loss": 0.3195,
"step": 23725
},
{
"epoch": 0.95,
"learning_rate": 9.534734734734735e-06,
"loss": 0.3187,
"step": 23750
},
{
"epoch": 0.95,
"learning_rate": 9.534234234234235e-06,
"loss": 0.3351,
"step": 23775
},
{
"epoch": 0.95,
"learning_rate": 9.533733733733734e-06,
"loss": 0.3172,
"step": 23800
},
{
"epoch": 0.95,
"learning_rate": 9.533233233233235e-06,
"loss": 0.3206,
"step": 23825
},
{
"epoch": 0.95,
"learning_rate": 9.532752752752752e-06,
"loss": 0.3261,
"step": 23850
},
{
"epoch": 0.95,
"learning_rate": 9.532252252252253e-06,
"loss": 0.3204,
"step": 23875
},
{
"epoch": 0.95,
"learning_rate": 9.531751751751753e-06,
"loss": 0.3154,
"step": 23900
},
{
"epoch": 0.95,
"learning_rate": 9.531251251251252e-06,
"loss": 0.3159,
"step": 23925
},
{
"epoch": 0.96,
"learning_rate": 9.530750750750751e-06,
"loss": 0.326,
"step": 23950
},
{
"epoch": 0.96,
"learning_rate": 9.53025025025025e-06,
"loss": 0.3014,
"step": 23975
},
{
"epoch": 0.96,
"learning_rate": 9.52974974974975e-06,
"loss": 0.312,
"step": 24000
},
{
"epoch": 0.96,
"eval_loss": 0.46919143199920654,
"eval_runtime": 2551.3752,
"eval_samples_per_second": 6.355,
"eval_steps_per_second": 0.159,
"eval_wer": 28.381680683929357,
"step": 24000
},
{
"epoch": 0.96,
"learning_rate": 9.529249249249251e-06,
"loss": 0.317,
"step": 24025
},
{
"epoch": 0.96,
"learning_rate": 9.52874874874875e-06,
"loss": 0.3128,
"step": 24050
},
{
"epoch": 0.96,
"learning_rate": 9.528248248248248e-06,
"loss": 0.324,
"step": 24075
},
{
"epoch": 0.96,
"learning_rate": 9.527747747747749e-06,
"loss": 0.3367,
"step": 24100
},
{
"epoch": 0.96,
"learning_rate": 9.527247247247248e-06,
"loss": 0.3159,
"step": 24125
},
{
"epoch": 0.96,
"learning_rate": 9.526746746746747e-06,
"loss": 0.3288,
"step": 24150
},
{
"epoch": 0.96,
"learning_rate": 9.526246246246247e-06,
"loss": 0.3379,
"step": 24175
},
{
"epoch": 0.97,
"learning_rate": 9.525745745745748e-06,
"loss": 0.3359,
"step": 24200
},
{
"epoch": 0.97,
"learning_rate": 9.525245245245245e-06,
"loss": 0.3146,
"step": 24225
},
{
"epoch": 0.97,
"learning_rate": 9.524744744744745e-06,
"loss": 0.3054,
"step": 24250
},
{
"epoch": 0.97,
"learning_rate": 9.524244244244246e-06,
"loss": 0.3329,
"step": 24275
},
{
"epoch": 0.97,
"learning_rate": 9.523743743743745e-06,
"loss": 0.3157,
"step": 24300
},
{
"epoch": 0.97,
"learning_rate": 9.523243243243244e-06,
"loss": 0.3252,
"step": 24325
},
{
"epoch": 0.97,
"learning_rate": 9.522742742742743e-06,
"loss": 0.3199,
"step": 24350
},
{
"epoch": 0.97,
"learning_rate": 9.522242242242243e-06,
"loss": 0.2962,
"step": 24375
},
{
"epoch": 0.97,
"learning_rate": 9.521741741741742e-06,
"loss": 0.3197,
"step": 24400
},
{
"epoch": 0.97,
"learning_rate": 9.521241241241243e-06,
"loss": 0.3105,
"step": 24425
},
{
"epoch": 0.98,
"learning_rate": 9.520740740740742e-06,
"loss": 0.3158,
"step": 24450
},
{
"epoch": 0.98,
"learning_rate": 9.52024024024024e-06,
"loss": 0.3084,
"step": 24475
},
{
"epoch": 0.98,
"learning_rate": 9.519739739739741e-06,
"loss": 0.3258,
"step": 24500
},
{
"epoch": 0.98,
"learning_rate": 9.51923923923924e-06,
"loss": 0.3087,
"step": 24525
},
{
"epoch": 0.98,
"learning_rate": 9.51873873873874e-06,
"loss": 0.323,
"step": 24550
},
{
"epoch": 0.98,
"learning_rate": 9.518238238238239e-06,
"loss": 0.3153,
"step": 24575
},
{
"epoch": 0.98,
"learning_rate": 9.517737737737738e-06,
"loss": 0.3256,
"step": 24600
},
{
"epoch": 0.98,
"learning_rate": 9.517237237237237e-06,
"loss": 0.3461,
"step": 24625
},
{
"epoch": 0.98,
"learning_rate": 9.516736736736738e-06,
"loss": 0.319,
"step": 24650
},
{
"epoch": 0.98,
"learning_rate": 9.516236236236238e-06,
"loss": 0.3091,
"step": 24675
},
{
"epoch": 0.99,
"learning_rate": 9.515735735735735e-06,
"loss": 0.3109,
"step": 24700
},
{
"epoch": 0.99,
"learning_rate": 9.515235235235236e-06,
"loss": 0.3062,
"step": 24725
},
{
"epoch": 0.99,
"learning_rate": 9.514734734734736e-06,
"loss": 0.3162,
"step": 24750
},
{
"epoch": 0.99,
"learning_rate": 9.514234234234235e-06,
"loss": 0.3184,
"step": 24775
},
{
"epoch": 0.99,
"learning_rate": 9.513733733733734e-06,
"loss": 0.3168,
"step": 24800
},
{
"epoch": 0.99,
"learning_rate": 9.513233233233235e-06,
"loss": 0.315,
"step": 24825
},
{
"epoch": 0.99,
"learning_rate": 9.512732732732733e-06,
"loss": 0.3023,
"step": 24850
},
{
"epoch": 0.99,
"learning_rate": 9.512232232232232e-06,
"loss": 0.3242,
"step": 24875
},
{
"epoch": 0.99,
"learning_rate": 9.511731731731733e-06,
"loss": 0.3337,
"step": 24900
},
{
"epoch": 0.99,
"learning_rate": 9.511231231231232e-06,
"loss": 0.3149,
"step": 24925
},
{
"epoch": 0.99,
"learning_rate": 9.510730730730732e-06,
"loss": 0.3085,
"step": 24950
},
{
"epoch": 1.0,
"learning_rate": 9.510230230230231e-06,
"loss": 0.3263,
"step": 24975
},
{
"epoch": 1.0,
"learning_rate": 9.50972972972973e-06,
"loss": 0.3089,
"step": 25000
},
{
"epoch": 1.0,
"eval_loss": 0.457874059677124,
"eval_runtime": 2679.5488,
"eval_samples_per_second": 6.051,
"eval_steps_per_second": 0.152,
"eval_wer": 27.82818510495602,
"step": 25000
},
{
"epoch": 1.0,
"learning_rate": 9.50922922922923e-06,
"loss": 0.3246,
"step": 25025
},
{
"epoch": 1.0,
"learning_rate": 9.50872872872873e-06,
"loss": 0.3371,
"step": 25050
},
{
"epoch": 1.0,
"learning_rate": 9.50822822822823e-06,
"loss": 0.2992,
"step": 25075
},
{
"epoch": 1.0,
"learning_rate": 9.507727727727727e-06,
"loss": 0.2763,
"step": 25100
},
{
"epoch": 1.0,
"learning_rate": 9.507227227227228e-06,
"loss": 0.277,
"step": 25125
},
{
"epoch": 1.0,
"learning_rate": 9.506726726726728e-06,
"loss": 0.2702,
"step": 25150
},
{
"epoch": 1.0,
"learning_rate": 9.506226226226227e-06,
"loss": 0.2656,
"step": 25175
},
{
"epoch": 1.0,
"learning_rate": 9.505725725725726e-06,
"loss": 0.2767,
"step": 25200
},
{
"epoch": 1.01,
"learning_rate": 9.505225225225226e-06,
"loss": 0.2745,
"step": 25225
},
{
"epoch": 1.01,
"learning_rate": 9.504724724724725e-06,
"loss": 0.2637,
"step": 25250
},
{
"epoch": 1.01,
"learning_rate": 9.504224224224226e-06,
"loss": 0.2704,
"step": 25275
},
{
"epoch": 1.01,
"learning_rate": 9.503723723723725e-06,
"loss": 0.2554,
"step": 25300
},
{
"epoch": 1.01,
"learning_rate": 9.503223223223223e-06,
"loss": 0.271,
"step": 25325
},
{
"epoch": 1.01,
"learning_rate": 9.502722722722724e-06,
"loss": 0.2757,
"step": 25350
},
{
"epoch": 1.01,
"learning_rate": 9.502222222222223e-06,
"loss": 0.2606,
"step": 25375
},
{
"epoch": 1.01,
"learning_rate": 9.501721721721722e-06,
"loss": 0.2664,
"step": 25400
},
{
"epoch": 1.01,
"learning_rate": 9.501221221221222e-06,
"loss": 0.2702,
"step": 25425
},
{
"epoch": 1.01,
"learning_rate": 9.500720720720723e-06,
"loss": 0.2633,
"step": 25450
},
{
"epoch": 1.02,
"learning_rate": 9.50022022022022e-06,
"loss": 0.2816,
"step": 25475
},
{
"epoch": 1.02,
"learning_rate": 9.49971971971972e-06,
"loss": 0.2848,
"step": 25500
},
{
"epoch": 1.02,
"learning_rate": 9.49921921921922e-06,
"loss": 0.2655,
"step": 25525
},
{
"epoch": 1.02,
"learning_rate": 9.49871871871872e-06,
"loss": 0.2652,
"step": 25550
},
{
"epoch": 1.02,
"learning_rate": 9.49821821821822e-06,
"loss": 0.2704,
"step": 25575
},
{
"epoch": 1.02,
"learning_rate": 9.497717717717718e-06,
"loss": 0.2605,
"step": 25600
},
{
"epoch": 1.02,
"learning_rate": 9.497217217217218e-06,
"loss": 0.2674,
"step": 25625
},
{
"epoch": 1.02,
"learning_rate": 9.496716716716717e-06,
"loss": 0.2677,
"step": 25650
},
{
"epoch": 1.02,
"learning_rate": 9.496216216216218e-06,
"loss": 0.2761,
"step": 25675
},
{
"epoch": 1.02,
"learning_rate": 9.495715715715716e-06,
"loss": 0.2626,
"step": 25700
},
{
"epoch": 1.03,
"learning_rate": 9.495215215215215e-06,
"loss": 0.2637,
"step": 25725
},
{
"epoch": 1.03,
"learning_rate": 9.494714714714716e-06,
"loss": 0.2704,
"step": 25750
},
{
"epoch": 1.03,
"learning_rate": 9.494214214214215e-06,
"loss": 0.2756,
"step": 25775
},
{
"epoch": 1.03,
"learning_rate": 9.493713713713715e-06,
"loss": 0.2807,
"step": 25800
},
{
"epoch": 1.03,
"learning_rate": 9.493213213213214e-06,
"loss": 0.2798,
"step": 25825
},
{
"epoch": 1.03,
"learning_rate": 9.492712712712713e-06,
"loss": 0.2728,
"step": 25850
},
{
"epoch": 1.03,
"learning_rate": 9.492212212212212e-06,
"loss": 0.2664,
"step": 25875
},
{
"epoch": 1.03,
"learning_rate": 9.491731731731733e-06,
"loss": 0.2811,
"step": 25900
},
{
"epoch": 1.03,
"learning_rate": 9.491231231231231e-06,
"loss": 0.2582,
"step": 25925
},
{
"epoch": 1.03,
"learning_rate": 9.490730730730732e-06,
"loss": 0.2739,
"step": 25950
},
{
"epoch": 1.04,
"learning_rate": 9.490230230230231e-06,
"loss": 0.264,
"step": 25975
},
{
"epoch": 1.04,
"learning_rate": 9.48972972972973e-06,
"loss": 0.2625,
"step": 26000
},
{
"epoch": 1.04,
"eval_loss": 0.45843926072120667,
"eval_runtime": 2831.694,
"eval_samples_per_second": 5.726,
"eval_steps_per_second": 0.143,
"eval_wer": 27.744929502547777,
"step": 26000
},
{
"epoch": 1.04,
"learning_rate": 9.48922922922923e-06,
"loss": 0.2841,
"step": 26025
},
{
"epoch": 1.04,
"learning_rate": 9.48872872872873e-06,
"loss": 0.2881,
"step": 26050
},
{
"epoch": 1.04,
"learning_rate": 9.488228228228228e-06,
"loss": 0.2915,
"step": 26075
},
{
"epoch": 1.04,
"learning_rate": 9.487727727727728e-06,
"loss": 0.2687,
"step": 26100
},
{
"epoch": 1.04,
"learning_rate": 9.487227227227229e-06,
"loss": 0.2678,
"step": 26125
},
{
"epoch": 1.04,
"learning_rate": 9.486726726726728e-06,
"loss": 0.2724,
"step": 26150
},
{
"epoch": 1.04,
"learning_rate": 9.486226226226227e-06,
"loss": 0.2792,
"step": 26175
},
{
"epoch": 1.04,
"learning_rate": 9.485725725725727e-06,
"loss": 0.2657,
"step": 26200
},
{
"epoch": 1.05,
"learning_rate": 9.485225225225226e-06,
"loss": 0.2722,
"step": 26225
},
{
"epoch": 1.05,
"learning_rate": 9.484724724724725e-06,
"loss": 0.2704,
"step": 26250
},
{
"epoch": 1.05,
"learning_rate": 9.484224224224226e-06,
"loss": 0.2595,
"step": 26275
},
{
"epoch": 1.05,
"learning_rate": 9.483723723723724e-06,
"loss": 0.2699,
"step": 26300
},
{
"epoch": 1.05,
"learning_rate": 9.483223223223223e-06,
"loss": 0.2857,
"step": 26325
},
{
"epoch": 1.05,
"learning_rate": 9.482722722722724e-06,
"loss": 0.2664,
"step": 26350
},
{
"epoch": 1.05,
"learning_rate": 9.482222222222223e-06,
"loss": 0.2606,
"step": 26375
},
{
"epoch": 1.05,
"learning_rate": 9.481721721721723e-06,
"loss": 0.2607,
"step": 26400
},
{
"epoch": 1.05,
"learning_rate": 9.481221221221222e-06,
"loss": 0.2487,
"step": 26425
},
{
"epoch": 1.05,
"learning_rate": 9.480720720720721e-06,
"loss": 0.2603,
"step": 26450
},
{
"epoch": 1.06,
"learning_rate": 9.48022022022022e-06,
"loss": 0.2819,
"step": 26475
},
{
"epoch": 1.06,
"learning_rate": 9.479719719719721e-06,
"loss": 0.27,
"step": 26500
},
{
"epoch": 1.06,
"learning_rate": 9.47921921921922e-06,
"loss": 0.2577,
"step": 26525
},
{
"epoch": 1.06,
"learning_rate": 9.478718718718718e-06,
"loss": 0.2743,
"step": 26550
},
{
"epoch": 1.06,
"learning_rate": 9.47821821821822e-06,
"loss": 0.2806,
"step": 26575
},
{
"epoch": 1.06,
"learning_rate": 9.477717717717719e-06,
"loss": 0.2736,
"step": 26600
},
{
"epoch": 1.06,
"learning_rate": 9.477217217217218e-06,
"loss": 0.2699,
"step": 26625
},
{
"epoch": 1.06,
"learning_rate": 9.476716716716717e-06,
"loss": 0.2743,
"step": 26650
},
{
"epoch": 1.06,
"learning_rate": 9.476216216216218e-06,
"loss": 0.2706,
"step": 26675
},
{
"epoch": 1.06,
"learning_rate": 9.475715715715716e-06,
"loss": 0.2658,
"step": 26700
},
{
"epoch": 1.07,
"learning_rate": 9.475215215215215e-06,
"loss": 0.263,
"step": 26725
},
{
"epoch": 1.07,
"learning_rate": 9.474714714714716e-06,
"loss": 0.2653,
"step": 26750
},
{
"epoch": 1.07,
"learning_rate": 9.474214214214215e-06,
"loss": 0.2622,
"step": 26775
},
{
"epoch": 1.07,
"learning_rate": 9.473713713713715e-06,
"loss": 0.2743,
"step": 26800
},
{
"epoch": 1.07,
"learning_rate": 9.473213213213214e-06,
"loss": 0.2531,
"step": 26825
},
{
"epoch": 1.07,
"learning_rate": 9.472712712712713e-06,
"loss": 0.2686,
"step": 26850
},
{
"epoch": 1.07,
"learning_rate": 9.472212212212213e-06,
"loss": 0.2847,
"step": 26875
},
{
"epoch": 1.07,
"learning_rate": 9.471711711711714e-06,
"loss": 0.2556,
"step": 26900
},
{
"epoch": 1.07,
"learning_rate": 9.471211211211211e-06,
"loss": 0.2642,
"step": 26925
},
{
"epoch": 1.07,
"learning_rate": 9.47071071071071e-06,
"loss": 0.2719,
"step": 26950
},
{
"epoch": 1.08,
"learning_rate": 9.470210210210212e-06,
"loss": 0.2632,
"step": 26975
},
{
"epoch": 1.08,
"learning_rate": 9.46970970970971e-06,
"loss": 0.2758,
"step": 27000
},
{
"epoch": 1.08,
"eval_loss": 0.45501989126205444,
"eval_runtime": 2547.6663,
"eval_samples_per_second": 6.364,
"eval_steps_per_second": 0.159,
"eval_wer": 26.85301531748907,
"step": 27000
},
{
"epoch": 1.08,
"learning_rate": 9.46920920920921e-06,
"loss": 0.2766,
"step": 27025
},
{
"epoch": 1.08,
"learning_rate": 9.46870870870871e-06,
"loss": 0.2724,
"step": 27050
},
{
"epoch": 1.08,
"learning_rate": 9.468208208208209e-06,
"loss": 0.265,
"step": 27075
},
{
"epoch": 1.08,
"learning_rate": 9.467707707707708e-06,
"loss": 0.2627,
"step": 27100
},
{
"epoch": 1.08,
"learning_rate": 9.467207207207207e-06,
"loss": 0.2648,
"step": 27125
},
{
"epoch": 1.08,
"learning_rate": 9.466706706706708e-06,
"loss": 0.2676,
"step": 27150
},
{
"epoch": 1.08,
"learning_rate": 9.466206206206206e-06,
"loss": 0.2634,
"step": 27175
},
{
"epoch": 1.08,
"learning_rate": 9.465705705705707e-06,
"loss": 0.2631,
"step": 27200
},
{
"epoch": 1.09,
"learning_rate": 9.465205205205206e-06,
"loss": 0.2729,
"step": 27225
},
{
"epoch": 1.09,
"learning_rate": 9.464704704704705e-06,
"loss": 0.2772,
"step": 27250
},
{
"epoch": 1.09,
"learning_rate": 9.464204204204205e-06,
"loss": 0.2605,
"step": 27275
},
{
"epoch": 1.09,
"learning_rate": 9.463703703703706e-06,
"loss": 0.2753,
"step": 27300
},
{
"epoch": 1.09,
"learning_rate": 9.463203203203203e-06,
"loss": 0.2719,
"step": 27325
},
{
"epoch": 1.09,
"learning_rate": 9.462702702702703e-06,
"loss": 0.2802,
"step": 27350
},
{
"epoch": 1.09,
"learning_rate": 9.462202202202204e-06,
"loss": 0.2579,
"step": 27375
},
{
"epoch": 1.09,
"learning_rate": 9.461701701701701e-06,
"loss": 0.2781,
"step": 27400
},
{
"epoch": 1.09,
"learning_rate": 9.461201201201202e-06,
"loss": 0.292,
"step": 27425
},
{
"epoch": 1.09,
"learning_rate": 9.460700700700702e-06,
"loss": 0.25,
"step": 27450
},
{
"epoch": 1.1,
"learning_rate": 9.460200200200201e-06,
"loss": 0.2518,
"step": 27475
},
{
"epoch": 1.1,
"learning_rate": 9.4596996996997e-06,
"loss": 0.264,
"step": 27500
},
{
"epoch": 1.1,
"learning_rate": 9.459199199199201e-06,
"loss": 0.2603,
"step": 27525
},
{
"epoch": 1.1,
"learning_rate": 9.458698698698699e-06,
"loss": 0.2601,
"step": 27550
},
{
"epoch": 1.1,
"learning_rate": 9.458198198198198e-06,
"loss": 0.275,
"step": 27575
},
{
"epoch": 1.1,
"learning_rate": 9.457697697697699e-06,
"loss": 0.2681,
"step": 27600
},
{
"epoch": 1.1,
"learning_rate": 9.457197197197198e-06,
"loss": 0.2595,
"step": 27625
},
{
"epoch": 1.1,
"learning_rate": 9.456696696696698e-06,
"loss": 0.2797,
"step": 27650
},
{
"epoch": 1.1,
"learning_rate": 9.456196196196197e-06,
"loss": 0.2564,
"step": 27675
},
{
"epoch": 1.1,
"learning_rate": 9.455695695695696e-06,
"loss": 0.2565,
"step": 27700
},
{
"epoch": 1.11,
"learning_rate": 9.455195195195196e-06,
"loss": 0.2833,
"step": 27725
},
{
"epoch": 1.11,
"learning_rate": 9.454694694694695e-06,
"loss": 0.2648,
"step": 27750
},
{
"epoch": 1.11,
"learning_rate": 9.454194194194196e-06,
"loss": 0.2607,
"step": 27775
},
{
"epoch": 1.11,
"learning_rate": 9.453693693693693e-06,
"loss": 0.2697,
"step": 27800
},
{
"epoch": 1.11,
"learning_rate": 9.453193193193194e-06,
"loss": 0.2778,
"step": 27825
},
{
"epoch": 1.11,
"learning_rate": 9.452692692692694e-06,
"loss": 0.2616,
"step": 27850
},
{
"epoch": 1.11,
"learning_rate": 9.452192192192193e-06,
"loss": 0.27,
"step": 27875
},
{
"epoch": 1.11,
"learning_rate": 9.451691691691692e-06,
"loss": 0.2726,
"step": 27900
},
{
"epoch": 1.11,
"learning_rate": 9.451191191191193e-06,
"loss": 0.2444,
"step": 27925
},
{
"epoch": 1.11,
"learning_rate": 9.450690690690691e-06,
"loss": 0.258,
"step": 27950
},
{
"epoch": 1.12,
"learning_rate": 9.45019019019019e-06,
"loss": 0.2758,
"step": 27975
},
{
"epoch": 1.12,
"learning_rate": 9.449689689689691e-06,
"loss": 0.265,
"step": 28000
},
{
"epoch": 1.12,
"eval_loss": 0.45008718967437744,
"eval_runtime": 2652.1712,
"eval_samples_per_second": 6.113,
"eval_steps_per_second": 0.153,
"eval_wer": 28.59213234557242,
"step": 28000
},
{
"epoch": 1.12,
"learning_rate": 9.44920920920921e-06,
"loss": 0.2703,
"step": 28025
},
{
"epoch": 1.12,
"learning_rate": 9.44870870870871e-06,
"loss": 0.2573,
"step": 28050
},
{
"epoch": 1.12,
"learning_rate": 9.448208208208209e-06,
"loss": 0.2824,
"step": 28075
},
{
"epoch": 1.12,
"learning_rate": 9.447707707707708e-06,
"loss": 0.2697,
"step": 28100
},
{
"epoch": 1.12,
"learning_rate": 9.44720720720721e-06,
"loss": 0.2586,
"step": 28125
},
{
"epoch": 1.12,
"learning_rate": 9.446706706706707e-06,
"loss": 0.2882,
"step": 28150
},
{
"epoch": 1.12,
"learning_rate": 9.446206206206206e-06,
"loss": 0.2649,
"step": 28175
},
{
"epoch": 1.12,
"learning_rate": 9.445705705705707e-06,
"loss": 0.2542,
"step": 28200
},
{
"epoch": 1.13,
"learning_rate": 9.445205205205206e-06,
"loss": 0.263,
"step": 28225
},
{
"epoch": 1.13,
"learning_rate": 9.444704704704706e-06,
"loss": 0.2729,
"step": 28250
},
{
"epoch": 1.13,
"learning_rate": 9.444204204204205e-06,
"loss": 0.2861,
"step": 28275
},
{
"epoch": 1.13,
"learning_rate": 9.443703703703704e-06,
"loss": 0.2692,
"step": 28300
},
{
"epoch": 1.13,
"learning_rate": 9.443203203203204e-06,
"loss": 0.2826,
"step": 28325
},
{
"epoch": 1.13,
"learning_rate": 9.442702702702703e-06,
"loss": 0.2795,
"step": 28350
},
{
"epoch": 1.13,
"learning_rate": 9.442202202202204e-06,
"loss": 0.2655,
"step": 28375
},
{
"epoch": 1.13,
"learning_rate": 9.441701701701701e-06,
"loss": 0.2605,
"step": 28400
},
{
"epoch": 1.13,
"learning_rate": 9.441201201201202e-06,
"loss": 0.2626,
"step": 28425
},
{
"epoch": 1.13,
"learning_rate": 9.440700700700702e-06,
"loss": 0.2867,
"step": 28450
},
{
"epoch": 1.14,
"learning_rate": 9.440200200200201e-06,
"loss": 0.272,
"step": 28475
},
{
"epoch": 1.14,
"learning_rate": 9.4396996996997e-06,
"loss": 0.257,
"step": 28500
},
{
"epoch": 1.14,
"learning_rate": 9.4391991991992e-06,
"loss": 0.2783,
"step": 28525
},
{
"epoch": 1.14,
"learning_rate": 9.438698698698699e-06,
"loss": 0.2602,
"step": 28550
},
{
"epoch": 1.14,
"learning_rate": 9.438198198198198e-06,
"loss": 0.2644,
"step": 28575
},
{
"epoch": 1.14,
"learning_rate": 9.4376976976977e-06,
"loss": 0.2554,
"step": 28600
},
{
"epoch": 1.14,
"learning_rate": 9.437197197197197e-06,
"loss": 0.2743,
"step": 28625
},
{
"epoch": 1.14,
"learning_rate": 9.436696696696698e-06,
"loss": 0.2724,
"step": 28650
},
{
"epoch": 1.14,
"learning_rate": 9.436196196196197e-06,
"loss": 0.2607,
"step": 28675
},
{
"epoch": 1.14,
"learning_rate": 9.435695695695696e-06,
"loss": 0.2626,
"step": 28700
},
{
"epoch": 1.15,
"learning_rate": 9.435195195195196e-06,
"loss": 0.2616,
"step": 28725
},
{
"epoch": 1.15,
"learning_rate": 9.434694694694697e-06,
"loss": 0.2602,
"step": 28750
},
{
"epoch": 1.15,
"learning_rate": 9.434194194194194e-06,
"loss": 0.2639,
"step": 28775
},
{
"epoch": 1.15,
"learning_rate": 9.433693693693694e-06,
"loss": 0.2564,
"step": 28800
},
{
"epoch": 1.15,
"learning_rate": 9.433193193193195e-06,
"loss": 0.2544,
"step": 28825
},
{
"epoch": 1.15,
"learning_rate": 9.432692692692694e-06,
"loss": 0.2874,
"step": 28850
},
{
"epoch": 1.15,
"learning_rate": 9.432192192192193e-06,
"loss": 0.2663,
"step": 28875
},
{
"epoch": 1.15,
"learning_rate": 9.431691691691692e-06,
"loss": 0.2658,
"step": 28900
},
{
"epoch": 1.15,
"learning_rate": 9.431191191191192e-06,
"loss": 0.286,
"step": 28925
},
{
"epoch": 1.15,
"learning_rate": 9.430690690690691e-06,
"loss": 0.2451,
"step": 28950
},
{
"epoch": 1.16,
"learning_rate": 9.43019019019019e-06,
"loss": 0.2811,
"step": 28975
},
{
"epoch": 1.16,
"learning_rate": 9.429689689689691e-06,
"loss": 0.258,
"step": 29000
},
{
"epoch": 1.16,
"eval_loss": 0.44391068816185,
"eval_runtime": 2504.9501,
"eval_samples_per_second": 6.472,
"eval_steps_per_second": 0.162,
"eval_wer": 26.30877036100554,
"step": 29000
},
{
"epoch": 1.16,
"learning_rate": 9.429189189189189e-06,
"loss": 0.2654,
"step": 29025
},
{
"epoch": 1.16,
"learning_rate": 9.42868868868869e-06,
"loss": 0.2587,
"step": 29050
},
{
"epoch": 1.16,
"learning_rate": 9.42818818818819e-06,
"loss": 0.2571,
"step": 29075
},
{
"epoch": 1.16,
"learning_rate": 9.427687687687689e-06,
"loss": 0.2734,
"step": 29100
},
{
"epoch": 1.16,
"learning_rate": 9.427187187187188e-06,
"loss": 0.2898,
"step": 29125
},
{
"epoch": 1.16,
"learning_rate": 9.426686686686687e-06,
"loss": 0.2514,
"step": 29150
},
{
"epoch": 1.16,
"learning_rate": 9.426186186186186e-06,
"loss": 0.2804,
"step": 29175
},
{
"epoch": 1.16,
"learning_rate": 9.425685685685686e-06,
"loss": 0.2812,
"step": 29200
},
{
"epoch": 1.17,
"learning_rate": 9.425185185185187e-06,
"loss": 0.265,
"step": 29225
},
{
"epoch": 1.17,
"learning_rate": 9.424684684684684e-06,
"loss": 0.2546,
"step": 29250
},
{
"epoch": 1.17,
"learning_rate": 9.424184184184185e-06,
"loss": 0.2818,
"step": 29275
},
{
"epoch": 1.17,
"learning_rate": 9.423683683683685e-06,
"loss": 0.2448,
"step": 29300
},
{
"epoch": 1.17,
"learning_rate": 9.423183183183184e-06,
"loss": 0.2791,
"step": 29325
},
{
"epoch": 1.17,
"learning_rate": 9.422682682682683e-06,
"loss": 0.2583,
"step": 29350
},
{
"epoch": 1.17,
"learning_rate": 9.422182182182184e-06,
"loss": 0.2737,
"step": 29375
},
{
"epoch": 1.17,
"learning_rate": 9.421701701701702e-06,
"loss": 0.266,
"step": 29400
},
{
"epoch": 1.17,
"learning_rate": 9.421201201201203e-06,
"loss": 0.265,
"step": 29425
},
{
"epoch": 1.17,
"learning_rate": 9.420700700700702e-06,
"loss": 0.2771,
"step": 29450
},
{
"epoch": 1.18,
"learning_rate": 9.420200200200201e-06,
"loss": 0.2569,
"step": 29475
},
{
"epoch": 1.18,
"learning_rate": 9.4196996996997e-06,
"loss": 0.2621,
"step": 29500
},
{
"epoch": 1.18,
"learning_rate": 9.4191991991992e-06,
"loss": 0.2703,
"step": 29525
},
{
"epoch": 1.18,
"learning_rate": 9.418698698698699e-06,
"loss": 0.2786,
"step": 29550
},
{
"epoch": 1.18,
"learning_rate": 9.418198198198198e-06,
"loss": 0.2628,
"step": 29575
},
{
"epoch": 1.18,
"learning_rate": 9.4176976976977e-06,
"loss": 0.295,
"step": 29600
},
{
"epoch": 1.18,
"learning_rate": 9.417197197197197e-06,
"loss": 0.2829,
"step": 29625
},
{
"epoch": 1.18,
"learning_rate": 9.416696696696698e-06,
"loss": 0.2721,
"step": 29650
},
{
"epoch": 1.18,
"learning_rate": 9.416196196196197e-06,
"loss": 0.2721,
"step": 29675
},
{
"epoch": 1.18,
"learning_rate": 9.415695695695697e-06,
"loss": 0.2683,
"step": 29700
},
{
"epoch": 1.19,
"learning_rate": 9.415195195195196e-06,
"loss": 0.2655,
"step": 29725
},
{
"epoch": 1.19,
"learning_rate": 9.414694694694695e-06,
"loss": 0.2567,
"step": 29750
},
{
"epoch": 1.19,
"learning_rate": 9.414194194194194e-06,
"loss": 0.2542,
"step": 29775
},
{
"epoch": 1.19,
"learning_rate": 9.413693693693694e-06,
"loss": 0.2722,
"step": 29800
},
{
"epoch": 1.19,
"learning_rate": 9.413193193193195e-06,
"loss": 0.2707,
"step": 29825
},
{
"epoch": 1.19,
"learning_rate": 9.412692692692692e-06,
"loss": 0.2718,
"step": 29850
},
{
"epoch": 1.19,
"learning_rate": 9.412192192192193e-06,
"loss": 0.2634,
"step": 29875
},
{
"epoch": 1.19,
"learning_rate": 9.411691691691693e-06,
"loss": 0.2643,
"step": 29900
},
{
"epoch": 1.19,
"learning_rate": 9.411191191191192e-06,
"loss": 0.2618,
"step": 29925
},
{
"epoch": 1.19,
"learning_rate": 9.410690690690691e-06,
"loss": 0.2684,
"step": 29950
},
{
"epoch": 1.2,
"learning_rate": 9.41019019019019e-06,
"loss": 0.282,
"step": 29975
},
{
"epoch": 1.2,
"learning_rate": 9.40968968968969e-06,
"loss": 0.2837,
"step": 30000
},
{
"epoch": 1.2,
"eval_loss": 0.4546422064304352,
"eval_runtime": 2695.5326,
"eval_samples_per_second": 6.015,
"eval_steps_per_second": 0.151,
"eval_wer": 27.167536482142445,
"step": 30000
},
{
"epoch": 1.2,
"learning_rate": 9.40918918918919e-06,
"loss": 0.2669,
"step": 30025
},
{
"epoch": 1.2,
"learning_rate": 9.40868868868869e-06,
"loss": 0.2881,
"step": 30050
},
{
"epoch": 1.2,
"learning_rate": 9.40818818818819e-06,
"loss": 0.2759,
"step": 30075
},
{
"epoch": 1.2,
"learning_rate": 9.407687687687689e-06,
"loss": 0.2568,
"step": 30100
},
{
"epoch": 1.2,
"learning_rate": 9.407187187187188e-06,
"loss": 0.2779,
"step": 30125
},
{
"epoch": 1.2,
"learning_rate": 9.406686686686687e-06,
"loss": 0.2668,
"step": 30150
},
{
"epoch": 1.2,
"learning_rate": 9.406186186186187e-06,
"loss": 0.272,
"step": 30175
},
{
"epoch": 1.2,
"learning_rate": 9.405685685685686e-06,
"loss": 0.2638,
"step": 30200
},
{
"epoch": 1.21,
"learning_rate": 9.405185185185187e-06,
"loss": 0.27,
"step": 30225
},
{
"epoch": 1.21,
"learning_rate": 9.404684684684685e-06,
"loss": 0.2757,
"step": 30250
},
{
"epoch": 1.21,
"learning_rate": 9.404184184184186e-06,
"loss": 0.2499,
"step": 30275
},
{
"epoch": 1.21,
"learning_rate": 9.403683683683685e-06,
"loss": 0.2886,
"step": 30300
},
{
"epoch": 1.21,
"learning_rate": 9.403183183183184e-06,
"loss": 0.2756,
"step": 30325
},
{
"epoch": 1.21,
"learning_rate": 9.402682682682683e-06,
"loss": 0.261,
"step": 30350
},
{
"epoch": 1.21,
"learning_rate": 9.402182182182183e-06,
"loss": 0.2748,
"step": 30375
},
{
"epoch": 1.21,
"learning_rate": 9.401681681681682e-06,
"loss": 0.261,
"step": 30400
},
{
"epoch": 1.21,
"learning_rate": 9.401181181181181e-06,
"loss": 0.2839,
"step": 30425
},
{
"epoch": 1.21,
"learning_rate": 9.400680680680682e-06,
"loss": 0.2735,
"step": 30450
},
{
"epoch": 1.22,
"learning_rate": 9.40018018018018e-06,
"loss": 0.2659,
"step": 30475
},
{
"epoch": 1.22,
"learning_rate": 9.3996996996997e-06,
"loss": 0.2621,
"step": 30500
},
{
"epoch": 1.22,
"learning_rate": 9.3991991991992e-06,
"loss": 0.2744,
"step": 30525
},
{
"epoch": 1.22,
"learning_rate": 9.3986986986987e-06,
"loss": 0.2632,
"step": 30550
},
{
"epoch": 1.22,
"learning_rate": 9.398198198198199e-06,
"loss": 0.2589,
"step": 30575
},
{
"epoch": 1.22,
"learning_rate": 9.397697697697698e-06,
"loss": 0.2528,
"step": 30600
},
{
"epoch": 1.22,
"learning_rate": 9.397197197197197e-06,
"loss": 0.265,
"step": 30625
},
{
"epoch": 1.22,
"learning_rate": 9.396696696696698e-06,
"loss": 0.2569,
"step": 30650
},
{
"epoch": 1.22,
"learning_rate": 9.396196196196197e-06,
"loss": 0.2646,
"step": 30675
},
{
"epoch": 1.22,
"learning_rate": 9.395695695695697e-06,
"loss": 0.2737,
"step": 30700
},
{
"epoch": 1.23,
"learning_rate": 9.395195195195196e-06,
"loss": 0.2555,
"step": 30725
},
{
"epoch": 1.23,
"learning_rate": 9.394694694694695e-06,
"loss": 0.2671,
"step": 30750
},
{
"epoch": 1.23,
"learning_rate": 9.394194194194195e-06,
"loss": 0.2693,
"step": 30775
},
{
"epoch": 1.23,
"learning_rate": 9.393693693693694e-06,
"loss": 0.2795,
"step": 30800
},
{
"epoch": 1.23,
"learning_rate": 9.393193193193193e-06,
"loss": 0.2641,
"step": 30825
},
{
"epoch": 1.23,
"learning_rate": 9.392692692692693e-06,
"loss": 0.2789,
"step": 30850
},
{
"epoch": 1.23,
"learning_rate": 9.392192192192194e-06,
"loss": 0.2617,
"step": 30875
},
{
"epoch": 1.23,
"learning_rate": 9.391691691691693e-06,
"loss": 0.2536,
"step": 30900
},
{
"epoch": 1.23,
"learning_rate": 9.391191191191192e-06,
"loss": 0.2636,
"step": 30925
},
{
"epoch": 1.23,
"learning_rate": 9.390690690690691e-06,
"loss": 0.2713,
"step": 30950
},
{
"epoch": 1.24,
"learning_rate": 9.39019019019019e-06,
"loss": 0.2741,
"step": 30975
},
{
"epoch": 1.24,
"learning_rate": 9.38968968968969e-06,
"loss": 0.2804,
"step": 31000
},
{
"epoch": 1.24,
"eval_loss": 0.44737279415130615,
"eval_runtime": 2512.7508,
"eval_samples_per_second": 6.452,
"eval_steps_per_second": 0.162,
"eval_wer": 26.34577285096476,
"step": 31000
},
{
"epoch": 1.24,
"learning_rate": 9.38918918918919e-06,
"loss": 0.277,
"step": 31025
},
{
"epoch": 1.24,
"learning_rate": 9.38868868868869e-06,
"loss": 0.2563,
"step": 31050
},
{
"epoch": 1.24,
"learning_rate": 9.388188188188188e-06,
"loss": 0.2455,
"step": 31075
},
{
"epoch": 1.24,
"learning_rate": 9.387687687687689e-06,
"loss": 0.2606,
"step": 31100
},
{
"epoch": 1.24,
"learning_rate": 9.387187187187188e-06,
"loss": 0.2602,
"step": 31125
},
{
"epoch": 1.24,
"learning_rate": 9.386686686686688e-06,
"loss": 0.2576,
"step": 31150
},
{
"epoch": 1.24,
"learning_rate": 9.386186186186187e-06,
"loss": 0.27,
"step": 31175
},
{
"epoch": 1.24,
"learning_rate": 9.385685685685686e-06,
"loss": 0.2806,
"step": 31200
},
{
"epoch": 1.25,
"learning_rate": 9.385185185185185e-06,
"loss": 0.2673,
"step": 31225
},
{
"epoch": 1.25,
"learning_rate": 9.384684684684685e-06,
"loss": 0.2766,
"step": 31250
},
{
"epoch": 1.25,
"learning_rate": 9.384184184184186e-06,
"loss": 0.2575,
"step": 31275
},
{
"epoch": 1.25,
"learning_rate": 9.383683683683685e-06,
"loss": 0.2526,
"step": 31300
},
{
"epoch": 1.25,
"learning_rate": 9.383183183183184e-06,
"loss": 0.2678,
"step": 31325
},
{
"epoch": 1.25,
"learning_rate": 9.382682682682684e-06,
"loss": 0.2711,
"step": 31350
},
{
"epoch": 1.25,
"learning_rate": 9.382182182182183e-06,
"loss": 0.2889,
"step": 31375
},
{
"epoch": 1.25,
"learning_rate": 9.381681681681682e-06,
"loss": 0.2709,
"step": 31400
},
{
"epoch": 1.25,
"learning_rate": 9.381181181181182e-06,
"loss": 0.2736,
"step": 31425
},
{
"epoch": 1.25,
"learning_rate": 9.38068068068068e-06,
"loss": 0.2699,
"step": 31450
},
{
"epoch": 1.26,
"learning_rate": 9.38018018018018e-06,
"loss": 0.2801,
"step": 31475
},
{
"epoch": 1.26,
"learning_rate": 9.379679679679681e-06,
"loss": 0.2774,
"step": 31500
},
{
"epoch": 1.26,
"learning_rate": 9.37917917917918e-06,
"loss": 0.2658,
"step": 31525
},
{
"epoch": 1.26,
"learning_rate": 9.37867867867868e-06,
"loss": 0.2663,
"step": 31550
},
{
"epoch": 1.26,
"learning_rate": 9.378178178178179e-06,
"loss": 0.2673,
"step": 31575
},
{
"epoch": 1.26,
"learning_rate": 9.377677677677678e-06,
"loss": 0.2722,
"step": 31600
},
{
"epoch": 1.26,
"learning_rate": 9.377177177177178e-06,
"loss": 0.2818,
"step": 31625
},
{
"epoch": 1.26,
"learning_rate": 9.376676676676677e-06,
"loss": 0.2689,
"step": 31650
},
{
"epoch": 1.26,
"learning_rate": 9.376176176176178e-06,
"loss": 0.2755,
"step": 31675
},
{
"epoch": 1.26,
"learning_rate": 9.375675675675675e-06,
"loss": 0.2563,
"step": 31700
},
{
"epoch": 1.27,
"learning_rate": 9.375175175175176e-06,
"loss": 0.2691,
"step": 31725
},
{
"epoch": 1.27,
"learning_rate": 9.374674674674676e-06,
"loss": 0.2775,
"step": 31750
},
{
"epoch": 1.27,
"learning_rate": 9.374174174174175e-06,
"loss": 0.2625,
"step": 31775
},
{
"epoch": 1.27,
"learning_rate": 9.373673673673674e-06,
"loss": 0.2526,
"step": 31800
},
{
"epoch": 1.27,
"learning_rate": 9.373173173173174e-06,
"loss": 0.2624,
"step": 31825
},
{
"epoch": 1.27,
"learning_rate": 9.372672672672673e-06,
"loss": 0.2823,
"step": 31850
},
{
"epoch": 1.27,
"learning_rate": 9.372172172172172e-06,
"loss": 0.2637,
"step": 31875
},
{
"epoch": 1.27,
"learning_rate": 9.371671671671673e-06,
"loss": 0.2747,
"step": 31900
},
{
"epoch": 1.27,
"learning_rate": 9.371171171171173e-06,
"loss": 0.2795,
"step": 31925
},
{
"epoch": 1.27,
"learning_rate": 9.370670670670672e-06,
"loss": 0.2643,
"step": 31950
},
{
"epoch": 1.28,
"learning_rate": 9.370170170170171e-06,
"loss": 0.2799,
"step": 31975
},
{
"epoch": 1.28,
"learning_rate": 9.36966966966967e-06,
"loss": 0.2612,
"step": 32000
},
{
"epoch": 1.28,
"eval_loss": 0.4532637298107147,
"eval_runtime": 2555.128,
"eval_samples_per_second": 6.345,
"eval_steps_per_second": 0.159,
"eval_wer": 25.984998573862367,
"step": 32000
},
{
"epoch": 1.28,
"learning_rate": 9.36916916916917e-06,
"loss": 0.2583,
"step": 32025
},
{
"epoch": 1.28,
"learning_rate": 9.368668668668669e-06,
"loss": 0.257,
"step": 32050
},
{
"epoch": 1.28,
"learning_rate": 9.368168168168168e-06,
"loss": 0.2726,
"step": 32075
},
{
"epoch": 1.28,
"learning_rate": 9.367667667667668e-06,
"loss": 0.2675,
"step": 32100
},
{
"epoch": 1.28,
"learning_rate": 9.367167167167169e-06,
"loss": 0.2606,
"step": 32125
},
{
"epoch": 1.28,
"learning_rate": 9.366666666666668e-06,
"loss": 0.2672,
"step": 32150
},
{
"epoch": 1.28,
"learning_rate": 9.366166166166167e-06,
"loss": 0.2622,
"step": 32175
},
{
"epoch": 1.28,
"learning_rate": 9.365665665665666e-06,
"loss": 0.2592,
"step": 32200
},
{
"epoch": 1.29,
"learning_rate": 9.365165165165166e-06,
"loss": 0.2618,
"step": 32225
},
{
"epoch": 1.29,
"learning_rate": 9.364664664664665e-06,
"loss": 0.2669,
"step": 32250
},
{
"epoch": 1.29,
"learning_rate": 9.364164164164164e-06,
"loss": 0.2725,
"step": 32275
},
{
"epoch": 1.29,
"learning_rate": 9.363663663663665e-06,
"loss": 0.2695,
"step": 32300
},
{
"epoch": 1.29,
"learning_rate": 9.363163163163163e-06,
"loss": 0.2727,
"step": 32325
},
{
"epoch": 1.29,
"learning_rate": 9.362662662662664e-06,
"loss": 0.28,
"step": 32350
},
{
"epoch": 1.29,
"learning_rate": 9.362162162162163e-06,
"loss": 0.2826,
"step": 32375
},
{
"epoch": 1.29,
"learning_rate": 9.361661661661663e-06,
"loss": 0.2728,
"step": 32400
},
{
"epoch": 1.29,
"learning_rate": 9.361161161161162e-06,
"loss": 0.2653,
"step": 32425
},
{
"epoch": 1.29,
"learning_rate": 9.360660660660661e-06,
"loss": 0.2655,
"step": 32450
},
{
"epoch": 1.3,
"learning_rate": 9.36016016016016e-06,
"loss": 0.2787,
"step": 32475
},
{
"epoch": 1.3,
"learning_rate": 9.35965965965966e-06,
"loss": 0.2677,
"step": 32500
},
{
"epoch": 1.3,
"learning_rate": 9.35915915915916e-06,
"loss": 0.2587,
"step": 32525
},
{
"epoch": 1.3,
"learning_rate": 9.358658658658658e-06,
"loss": 0.2685,
"step": 32550
},
{
"epoch": 1.3,
"learning_rate": 9.35815815815816e-06,
"loss": 0.2583,
"step": 32575
},
{
"epoch": 1.3,
"learning_rate": 9.357657657657659e-06,
"loss": 0.2673,
"step": 32600
},
{
"epoch": 1.3,
"learning_rate": 9.357157157157158e-06,
"loss": 0.2828,
"step": 32625
},
{
"epoch": 1.3,
"learning_rate": 9.356656656656657e-06,
"loss": 0.2753,
"step": 32650
},
{
"epoch": 1.3,
"learning_rate": 9.356156156156157e-06,
"loss": 0.2847,
"step": 32675
},
{
"epoch": 1.3,
"learning_rate": 9.355655655655656e-06,
"loss": 0.2671,
"step": 32700
},
{
"epoch": 1.31,
"learning_rate": 9.355155155155155e-06,
"loss": 0.2655,
"step": 32725
},
{
"epoch": 1.31,
"learning_rate": 9.354654654654656e-06,
"loss": 0.2602,
"step": 32750
},
{
"epoch": 1.31,
"learning_rate": 9.354154154154155e-06,
"loss": 0.2707,
"step": 32775
},
{
"epoch": 1.31,
"learning_rate": 9.353653653653655e-06,
"loss": 0.2577,
"step": 32800
},
{
"epoch": 1.31,
"learning_rate": 9.353153153153154e-06,
"loss": 0.2786,
"step": 32825
},
{
"epoch": 1.31,
"learning_rate": 9.352652652652653e-06,
"loss": 0.2529,
"step": 32850
},
{
"epoch": 1.31,
"learning_rate": 9.352152152152153e-06,
"loss": 0.2544,
"step": 32875
},
{
"epoch": 1.31,
"learning_rate": 9.351651651651652e-06,
"loss": 0.2748,
"step": 32900
},
{
"epoch": 1.31,
"learning_rate": 9.351151151151153e-06,
"loss": 0.2696,
"step": 32925
},
{
"epoch": 1.31,
"learning_rate": 9.35065065065065e-06,
"loss": 0.2646,
"step": 32950
},
{
"epoch": 1.32,
"learning_rate": 9.350150150150151e-06,
"loss": 0.2598,
"step": 32975
},
{
"epoch": 1.32,
"learning_rate": 9.34964964964965e-06,
"loss": 0.2551,
"step": 33000
},
{
"epoch": 1.32,
"eval_loss": 0.4496789276599884,
"eval_runtime": 2555.1297,
"eval_samples_per_second": 6.345,
"eval_steps_per_second": 0.159,
"eval_wer": 26.183886957393177,
"step": 33000
},
{
"epoch": 1.32,
"learning_rate": 9.34914914914915e-06,
"loss": 0.2877,
"step": 33025
},
{
"epoch": 1.32,
"learning_rate": 9.34864864864865e-06,
"loss": 0.2536,
"step": 33050
},
{
"epoch": 1.32,
"learning_rate": 9.348148148148149e-06,
"loss": 0.2592,
"step": 33075
},
{
"epoch": 1.32,
"learning_rate": 9.347647647647648e-06,
"loss": 0.2691,
"step": 33100
},
{
"epoch": 1.32,
"learning_rate": 9.347147147147147e-06,
"loss": 0.269,
"step": 33125
},
{
"epoch": 1.32,
"learning_rate": 9.346646646646648e-06,
"loss": 0.2585,
"step": 33150
},
{
"epoch": 1.32,
"learning_rate": 9.346146146146146e-06,
"loss": 0.2547,
"step": 33175
},
{
"epoch": 1.32,
"learning_rate": 9.345645645645647e-06,
"loss": 0.278,
"step": 33200
},
{
"epoch": 1.32,
"learning_rate": 9.345145145145146e-06,
"loss": 0.283,
"step": 33225
},
{
"epoch": 1.33,
"learning_rate": 9.344644644644645e-06,
"loss": 0.2708,
"step": 33250
},
{
"epoch": 1.33,
"learning_rate": 9.344144144144145e-06,
"loss": 0.2549,
"step": 33275
},
{
"epoch": 1.33,
"learning_rate": 9.343643643643644e-06,
"loss": 0.2601,
"step": 33300
},
{
"epoch": 1.33,
"learning_rate": 9.343143143143143e-06,
"loss": 0.2585,
"step": 33325
},
{
"epoch": 1.33,
"learning_rate": 9.342642642642643e-06,
"loss": 0.2794,
"step": 33350
},
{
"epoch": 1.33,
"learning_rate": 9.342142142142144e-06,
"loss": 0.2721,
"step": 33375
},
{
"epoch": 1.33,
"learning_rate": 9.341641641641643e-06,
"loss": 0.278,
"step": 33400
},
{
"epoch": 1.33,
"learning_rate": 9.341141141141142e-06,
"loss": 0.2702,
"step": 33425
},
{
"epoch": 1.33,
"learning_rate": 9.340640640640642e-06,
"loss": 0.2577,
"step": 33450
},
{
"epoch": 1.33,
"learning_rate": 9.34014014014014e-06,
"loss": 0.2706,
"step": 33475
},
{
"epoch": 1.34,
"learning_rate": 9.33963963963964e-06,
"loss": 0.25,
"step": 33500
},
{
"epoch": 1.34,
"learning_rate": 9.33913913913914e-06,
"loss": 0.2774,
"step": 33525
},
{
"epoch": 1.34,
"learning_rate": 9.33863863863864e-06,
"loss": 0.2676,
"step": 33550
},
{
"epoch": 1.34,
"learning_rate": 9.338138138138138e-06,
"loss": 0.2776,
"step": 33575
},
{
"epoch": 1.34,
"learning_rate": 9.337637637637639e-06,
"loss": 0.2542,
"step": 33600
},
{
"epoch": 1.34,
"learning_rate": 9.337137137137138e-06,
"loss": 0.273,
"step": 33625
},
{
"epoch": 1.34,
"learning_rate": 9.336636636636638e-06,
"loss": 0.2498,
"step": 33650
},
{
"epoch": 1.34,
"learning_rate": 9.336136136136137e-06,
"loss": 0.2624,
"step": 33675
},
{
"epoch": 1.34,
"learning_rate": 9.335635635635636e-06,
"loss": 0.255,
"step": 33700
},
{
"epoch": 1.34,
"learning_rate": 9.335135135135135e-06,
"loss": 0.2639,
"step": 33725
},
{
"epoch": 1.35,
"learning_rate": 9.334634634634635e-06,
"loss": 0.281,
"step": 33750
},
{
"epoch": 1.35,
"learning_rate": 9.334134134134136e-06,
"loss": 0.2733,
"step": 33775
},
{
"epoch": 1.35,
"learning_rate": 9.333633633633633e-06,
"loss": 0.2613,
"step": 33800
},
{
"epoch": 1.35,
"learning_rate": 9.333133133133134e-06,
"loss": 0.273,
"step": 33825
},
{
"epoch": 1.35,
"learning_rate": 9.332632632632634e-06,
"loss": 0.264,
"step": 33850
},
{
"epoch": 1.35,
"learning_rate": 9.332132132132133e-06,
"loss": 0.2665,
"step": 33875
},
{
"epoch": 1.35,
"learning_rate": 9.331631631631632e-06,
"loss": 0.264,
"step": 33900
},
{
"epoch": 1.35,
"learning_rate": 9.331131131131132e-06,
"loss": 0.2686,
"step": 33925
},
{
"epoch": 1.35,
"learning_rate": 9.330630630630631e-06,
"loss": 0.2709,
"step": 33950
},
{
"epoch": 1.35,
"learning_rate": 9.33013013013013e-06,
"loss": 0.2731,
"step": 33975
},
{
"epoch": 1.36,
"learning_rate": 9.329629629629631e-06,
"loss": 0.28,
"step": 34000
},
{
"epoch": 1.36,
"eval_loss": 0.44749680161476135,
"eval_runtime": 2532.2254,
"eval_samples_per_second": 6.403,
"eval_steps_per_second": 0.16,
"eval_wer": 26.161531286376142,
"step": 34000
},
{
"epoch": 1.36,
"learning_rate": 9.32912912912913e-06,
"loss": 0.2572,
"step": 34025
},
{
"epoch": 1.36,
"learning_rate": 9.32862862862863e-06,
"loss": 0.2828,
"step": 34050
},
{
"epoch": 1.36,
"learning_rate": 9.328128128128129e-06,
"loss": 0.268,
"step": 34075
},
{
"epoch": 1.36,
"learning_rate": 9.327627627627628e-06,
"loss": 0.2602,
"step": 34100
},
{
"epoch": 1.36,
"learning_rate": 9.327127127127128e-06,
"loss": 0.2651,
"step": 34125
},
{
"epoch": 1.36,
"learning_rate": 9.326626626626627e-06,
"loss": 0.2796,
"step": 34150
},
{
"epoch": 1.36,
"learning_rate": 9.326126126126128e-06,
"loss": 0.2649,
"step": 34175
},
{
"epoch": 1.36,
"learning_rate": 9.325625625625626e-06,
"loss": 0.2729,
"step": 34200
},
{
"epoch": 1.36,
"learning_rate": 9.325125125125127e-06,
"loss": 0.2492,
"step": 34225
},
{
"epoch": 1.37,
"learning_rate": 9.324624624624626e-06,
"loss": 0.2389,
"step": 34250
},
{
"epoch": 1.37,
"learning_rate": 9.324124124124125e-06,
"loss": 0.2584,
"step": 34275
},
{
"epoch": 1.37,
"learning_rate": 9.323623623623624e-06,
"loss": 0.2635,
"step": 34300
},
{
"epoch": 1.37,
"learning_rate": 9.323123123123124e-06,
"loss": 0.2556,
"step": 34325
},
{
"epoch": 1.37,
"learning_rate": 9.322622622622623e-06,
"loss": 0.2661,
"step": 34350
},
{
"epoch": 1.37,
"learning_rate": 9.322122122122122e-06,
"loss": 0.2698,
"step": 34375
},
{
"epoch": 1.37,
"learning_rate": 9.321621621621623e-06,
"loss": 0.2622,
"step": 34400
},
{
"epoch": 1.37,
"learning_rate": 9.321121121121121e-06,
"loss": 0.2606,
"step": 34425
},
{
"epoch": 1.37,
"learning_rate": 9.320620620620622e-06,
"loss": 0.2561,
"step": 34450
},
{
"epoch": 1.37,
"learning_rate": 9.320120120120121e-06,
"loss": 0.2681,
"step": 34475
},
{
"epoch": 1.38,
"learning_rate": 9.31961961961962e-06,
"loss": 0.2686,
"step": 34500
},
{
"epoch": 1.38,
"learning_rate": 9.31911911911912e-06,
"loss": 0.2691,
"step": 34525
},
{
"epoch": 1.38,
"learning_rate": 9.318618618618619e-06,
"loss": 0.2481,
"step": 34550
},
{
"epoch": 1.38,
"learning_rate": 9.318118118118118e-06,
"loss": 0.2579,
"step": 34575
},
{
"epoch": 1.38,
"learning_rate": 9.317617617617618e-06,
"loss": 0.2442,
"step": 34600
},
{
"epoch": 1.38,
"learning_rate": 9.317117117117119e-06,
"loss": 0.2605,
"step": 34625
},
{
"epoch": 1.38,
"learning_rate": 9.316616616616618e-06,
"loss": 0.2717,
"step": 34650
},
{
"epoch": 1.38,
"learning_rate": 9.316116116116117e-06,
"loss": 0.2749,
"step": 34675
},
{
"epoch": 1.38,
"learning_rate": 9.315615615615617e-06,
"loss": 0.2525,
"step": 34700
},
{
"epoch": 1.38,
"learning_rate": 9.315115115115116e-06,
"loss": 0.2586,
"step": 34725
},
{
"epoch": 1.39,
"learning_rate": 9.314614614614615e-06,
"loss": 0.2683,
"step": 34750
},
{
"epoch": 1.39,
"learning_rate": 9.314114114114114e-06,
"loss": 0.2538,
"step": 34775
},
{
"epoch": 1.39,
"learning_rate": 9.313613613613614e-06,
"loss": 0.2354,
"step": 34800
},
{
"epoch": 1.39,
"learning_rate": 9.313113113113113e-06,
"loss": 0.2591,
"step": 34825
},
{
"epoch": 1.39,
"learning_rate": 9.312612612612614e-06,
"loss": 0.28,
"step": 34850
},
{
"epoch": 1.39,
"learning_rate": 9.312112112112113e-06,
"loss": 0.2789,
"step": 34875
},
{
"epoch": 1.39,
"learning_rate": 9.311611611611613e-06,
"loss": 0.2741,
"step": 34900
},
{
"epoch": 1.39,
"learning_rate": 9.311111111111112e-06,
"loss": 0.2803,
"step": 34925
},
{
"epoch": 1.39,
"learning_rate": 9.310610610610611e-06,
"loss": 0.2699,
"step": 34950
},
{
"epoch": 1.39,
"learning_rate": 9.31011011011011e-06,
"loss": 0.2618,
"step": 34975
},
{
"epoch": 1.4,
"learning_rate": 9.30960960960961e-06,
"loss": 0.2775,
"step": 35000
},
{
"epoch": 1.4,
"eval_loss": 0.44763508439064026,
"eval_runtime": 2480.936,
"eval_samples_per_second": 6.535,
"eval_steps_per_second": 0.164,
"eval_wer": 25.96958086971269,
"step": 35000
},
{
"epoch": 1.4,
"learning_rate": 9.30910910910911e-06,
"loss": 0.2801,
"step": 35025
},
{
"epoch": 1.4,
"learning_rate": 9.308608608608608e-06,
"loss": 0.2666,
"step": 35050
},
{
"epoch": 1.4,
"learning_rate": 9.30810810810811e-06,
"loss": 0.2817,
"step": 35075
},
{
"epoch": 1.4,
"learning_rate": 9.307607607607609e-06,
"loss": 0.2618,
"step": 35100
},
{
"epoch": 1.4,
"learning_rate": 9.307107107107108e-06,
"loss": 0.2637,
"step": 35125
},
{
"epoch": 1.4,
"learning_rate": 9.306606606606607e-06,
"loss": 0.2679,
"step": 35150
},
{
"epoch": 1.4,
"learning_rate": 9.306106106106107e-06,
"loss": 0.2729,
"step": 35175
},
{
"epoch": 1.4,
"learning_rate": 9.305605605605606e-06,
"loss": 0.2659,
"step": 35200
},
{
"epoch": 1.4,
"learning_rate": 9.305105105105105e-06,
"loss": 0.2642,
"step": 35225
},
{
"epoch": 1.41,
"learning_rate": 9.304604604604606e-06,
"loss": 0.2607,
"step": 35250
},
{
"epoch": 1.41,
"learning_rate": 9.304104104104105e-06,
"loss": 0.2831,
"step": 35275
},
{
"epoch": 1.41,
"learning_rate": 9.303603603603605e-06,
"loss": 0.2681,
"step": 35300
},
{
"epoch": 1.41,
"learning_rate": 9.303103103103104e-06,
"loss": 0.2611,
"step": 35325
},
{
"epoch": 1.41,
"learning_rate": 9.302602602602603e-06,
"loss": 0.2525,
"step": 35350
},
{
"epoch": 1.41,
"learning_rate": 9.302102102102103e-06,
"loss": 0.2629,
"step": 35375
},
{
"epoch": 1.41,
"learning_rate": 9.301601601601602e-06,
"loss": 0.2576,
"step": 35400
},
{
"epoch": 1.41,
"learning_rate": 9.301101101101101e-06,
"loss": 0.2576,
"step": 35425
},
{
"epoch": 1.41,
"learning_rate": 9.3006006006006e-06,
"loss": 0.2558,
"step": 35450
},
{
"epoch": 1.41,
"learning_rate": 9.300100100100102e-06,
"loss": 0.2591,
"step": 35475
},
{
"epoch": 1.42,
"learning_rate": 9.299599599599601e-06,
"loss": 0.2646,
"step": 35500
},
{
"epoch": 1.42,
"learning_rate": 9.2990990990991e-06,
"loss": 0.2515,
"step": 35525
},
{
"epoch": 1.42,
"learning_rate": 9.2985985985986e-06,
"loss": 0.274,
"step": 35550
},
{
"epoch": 1.42,
"learning_rate": 9.298098098098099e-06,
"loss": 0.2696,
"step": 35575
},
{
"epoch": 1.42,
"learning_rate": 9.297597597597598e-06,
"loss": 0.2637,
"step": 35600
},
{
"epoch": 1.42,
"learning_rate": 9.297097097097097e-06,
"loss": 0.2644,
"step": 35625
},
{
"epoch": 1.42,
"learning_rate": 9.296596596596598e-06,
"loss": 0.262,
"step": 35650
},
{
"epoch": 1.42,
"learning_rate": 9.296096096096096e-06,
"loss": 0.2709,
"step": 35675
},
{
"epoch": 1.42,
"learning_rate": 9.295595595595597e-06,
"loss": 0.263,
"step": 35700
},
{
"epoch": 1.42,
"learning_rate": 9.295095095095096e-06,
"loss": 0.2569,
"step": 35725
},
{
"epoch": 1.43,
"learning_rate": 9.294594594594596e-06,
"loss": 0.2525,
"step": 35750
},
{
"epoch": 1.43,
"learning_rate": 9.294094094094095e-06,
"loss": 0.2584,
"step": 35775
},
{
"epoch": 1.43,
"learning_rate": 9.293593593593594e-06,
"loss": 0.2665,
"step": 35800
},
{
"epoch": 1.43,
"learning_rate": 9.293093093093093e-06,
"loss": 0.2693,
"step": 35825
},
{
"epoch": 1.43,
"learning_rate": 9.292592592592593e-06,
"loss": 0.257,
"step": 35850
},
{
"epoch": 1.43,
"learning_rate": 9.292092092092094e-06,
"loss": 0.2616,
"step": 35875
},
{
"epoch": 1.43,
"learning_rate": 9.291591591591593e-06,
"loss": 0.2711,
"step": 35900
},
{
"epoch": 1.43,
"learning_rate": 9.291091091091092e-06,
"loss": 0.2573,
"step": 35925
},
{
"epoch": 1.43,
"learning_rate": 9.290590590590592e-06,
"loss": 0.2708,
"step": 35950
},
{
"epoch": 1.43,
"learning_rate": 9.290090090090091e-06,
"loss": 0.2423,
"step": 35975
},
{
"epoch": 1.44,
"learning_rate": 9.28958958958959e-06,
"loss": 0.2609,
"step": 36000
},
{
"epoch": 1.44,
"eval_loss": 0.4396921396255493,
"eval_runtime": 2445.1333,
"eval_samples_per_second": 6.631,
"eval_steps_per_second": 0.166,
"eval_wer": 25.296598083579376,
"step": 36000
},
{
"epoch": 1.44,
"learning_rate": 9.28908908908909e-06,
"loss": 0.2572,
"step": 36025
},
{
"epoch": 1.44,
"learning_rate": 9.288588588588589e-06,
"loss": 0.2676,
"step": 36050
},
{
"epoch": 1.44,
"learning_rate": 9.288088088088088e-06,
"loss": 0.2508,
"step": 36075
},
{
"epoch": 1.44,
"learning_rate": 9.287587587587589e-06,
"loss": 0.2714,
"step": 36100
},
{
"epoch": 1.44,
"learning_rate": 9.287087087087088e-06,
"loss": 0.26,
"step": 36125
},
{
"epoch": 1.44,
"learning_rate": 9.286586586586588e-06,
"loss": 0.2648,
"step": 36150
},
{
"epoch": 1.44,
"learning_rate": 9.286086086086087e-06,
"loss": 0.2748,
"step": 36175
},
{
"epoch": 1.44,
"learning_rate": 9.285585585585586e-06,
"loss": 0.2602,
"step": 36200
},
{
"epoch": 1.44,
"learning_rate": 9.285085085085086e-06,
"loss": 0.2658,
"step": 36225
},
{
"epoch": 1.45,
"learning_rate": 9.284584584584585e-06,
"loss": 0.2623,
"step": 36250
},
{
"epoch": 1.45,
"learning_rate": 9.284084084084086e-06,
"loss": 0.2634,
"step": 36275
},
{
"epoch": 1.45,
"learning_rate": 9.283583583583583e-06,
"loss": 0.2832,
"step": 36300
},
{
"epoch": 1.45,
"learning_rate": 9.283083083083084e-06,
"loss": 0.2656,
"step": 36325
},
{
"epoch": 1.45,
"learning_rate": 9.282582582582584e-06,
"loss": 0.2565,
"step": 36350
},
{
"epoch": 1.45,
"learning_rate": 9.282082082082083e-06,
"loss": 0.2542,
"step": 36375
},
{
"epoch": 1.45,
"learning_rate": 9.281581581581582e-06,
"loss": 0.2594,
"step": 36400
},
{
"epoch": 1.45,
"learning_rate": 9.281081081081082e-06,
"loss": 0.2654,
"step": 36425
},
{
"epoch": 1.45,
"learning_rate": 9.280580580580581e-06,
"loss": 0.292,
"step": 36450
},
{
"epoch": 1.45,
"learning_rate": 9.28008008008008e-06,
"loss": 0.282,
"step": 36475
},
{
"epoch": 1.46,
"learning_rate": 9.279579579579581e-06,
"loss": 0.2795,
"step": 36500
},
{
"epoch": 1.46,
"learning_rate": 9.27907907907908e-06,
"loss": 0.263,
"step": 36525
},
{
"epoch": 1.46,
"learning_rate": 9.27857857857858e-06,
"loss": 0.272,
"step": 36550
},
{
"epoch": 1.46,
"learning_rate": 9.278098098098099e-06,
"loss": 0.2498,
"step": 36575
},
{
"epoch": 1.46,
"learning_rate": 9.277597597597598e-06,
"loss": 0.2626,
"step": 36600
},
{
"epoch": 1.46,
"learning_rate": 9.277097097097098e-06,
"loss": 0.2671,
"step": 36625
},
{
"epoch": 1.46,
"learning_rate": 9.276596596596597e-06,
"loss": 0.2622,
"step": 36650
},
{
"epoch": 1.46,
"learning_rate": 9.276096096096096e-06,
"loss": 0.2507,
"step": 36675
},
{
"epoch": 1.46,
"learning_rate": 9.275595595595597e-06,
"loss": 0.2606,
"step": 36700
},
{
"epoch": 1.46,
"learning_rate": 9.275095095095096e-06,
"loss": 0.2716,
"step": 36725
},
{
"epoch": 1.47,
"learning_rate": 9.274594594594596e-06,
"loss": 0.2699,
"step": 36750
},
{
"epoch": 1.47,
"learning_rate": 9.274094094094095e-06,
"loss": 0.2819,
"step": 36775
},
{
"epoch": 1.47,
"learning_rate": 9.273593593593594e-06,
"loss": 0.2681,
"step": 36800
},
{
"epoch": 1.47,
"learning_rate": 9.273093093093094e-06,
"loss": 0.2603,
"step": 36825
},
{
"epoch": 1.47,
"learning_rate": 9.272592592592593e-06,
"loss": 0.2556,
"step": 36850
},
{
"epoch": 1.47,
"learning_rate": 9.272092092092094e-06,
"loss": 0.2798,
"step": 36875
},
{
"epoch": 1.47,
"learning_rate": 9.271591591591592e-06,
"loss": 0.2623,
"step": 36900
},
{
"epoch": 1.47,
"learning_rate": 9.271091091091092e-06,
"loss": 0.2502,
"step": 36925
},
{
"epoch": 1.47,
"learning_rate": 9.270590590590592e-06,
"loss": 0.262,
"step": 36950
},
{
"epoch": 1.47,
"learning_rate": 9.270090090090091e-06,
"loss": 0.2504,
"step": 36975
},
{
"epoch": 1.48,
"learning_rate": 9.26958958958959e-06,
"loss": 0.2681,
"step": 37000
},
{
"epoch": 1.48,
"eval_loss": 0.4397401511669159,
"eval_runtime": 2578.9596,
"eval_samples_per_second": 6.287,
"eval_steps_per_second": 0.157,
"eval_wer": 26.684962342257613,
"step": 37000
},
{
"epoch": 1.48,
"learning_rate": 9.26908908908909e-06,
"loss": 0.2618,
"step": 37025
},
{
"epoch": 1.48,
"learning_rate": 9.268588588588589e-06,
"loss": 0.2717,
"step": 37050
},
{
"epoch": 1.48,
"learning_rate": 9.268088088088088e-06,
"loss": 0.2628,
"step": 37075
},
{
"epoch": 1.48,
"learning_rate": 9.26758758758759e-06,
"loss": 0.262,
"step": 37100
},
{
"epoch": 1.48,
"learning_rate": 9.267087087087087e-06,
"loss": 0.2531,
"step": 37125
},
{
"epoch": 1.48,
"learning_rate": 9.266586586586588e-06,
"loss": 0.2407,
"step": 37150
},
{
"epoch": 1.48,
"learning_rate": 9.266086086086087e-06,
"loss": 0.2717,
"step": 37175
},
{
"epoch": 1.48,
"learning_rate": 9.265585585585586e-06,
"loss": 0.2696,
"step": 37200
},
{
"epoch": 1.48,
"learning_rate": 9.265085085085086e-06,
"loss": 0.2718,
"step": 37225
},
{
"epoch": 1.49,
"learning_rate": 9.264584584584585e-06,
"loss": 0.2523,
"step": 37250
},
{
"epoch": 1.49,
"learning_rate": 9.264084084084084e-06,
"loss": 0.2637,
"step": 37275
},
{
"epoch": 1.49,
"learning_rate": 9.263583583583584e-06,
"loss": 0.2818,
"step": 37300
},
{
"epoch": 1.49,
"learning_rate": 9.263083083083085e-06,
"loss": 0.2812,
"step": 37325
},
{
"epoch": 1.49,
"learning_rate": 9.262582582582584e-06,
"loss": 0.2623,
"step": 37350
},
{
"epoch": 1.49,
"learning_rate": 9.262082082082083e-06,
"loss": 0.2615,
"step": 37375
},
{
"epoch": 1.49,
"learning_rate": 9.261581581581583e-06,
"loss": 0.2783,
"step": 37400
},
{
"epoch": 1.49,
"learning_rate": 9.261081081081082e-06,
"loss": 0.2577,
"step": 37425
},
{
"epoch": 1.49,
"learning_rate": 9.260580580580581e-06,
"loss": 0.2718,
"step": 37450
},
{
"epoch": 1.49,
"learning_rate": 9.26008008008008e-06,
"loss": 0.2569,
"step": 37475
},
{
"epoch": 1.5,
"learning_rate": 9.259579579579581e-06,
"loss": 0.2604,
"step": 37500
},
{
"epoch": 1.5,
"learning_rate": 9.259079079079079e-06,
"loss": 0.265,
"step": 37525
},
{
"epoch": 1.5,
"learning_rate": 9.25857857857858e-06,
"loss": 0.2688,
"step": 37550
},
{
"epoch": 1.5,
"learning_rate": 9.25807807807808e-06,
"loss": 0.2567,
"step": 37575
},
{
"epoch": 1.5,
"learning_rate": 9.257577577577579e-06,
"loss": 0.2747,
"step": 37600
},
{
"epoch": 1.5,
"learning_rate": 9.257077077077078e-06,
"loss": 0.27,
"step": 37625
},
{
"epoch": 1.5,
"learning_rate": 9.256576576576577e-06,
"loss": 0.2699,
"step": 37650
},
{
"epoch": 1.5,
"learning_rate": 9.256076076076076e-06,
"loss": 0.2645,
"step": 37675
},
{
"epoch": 1.5,
"learning_rate": 9.255575575575576e-06,
"loss": 0.2723,
"step": 37700
},
{
"epoch": 1.5,
"learning_rate": 9.255075075075077e-06,
"loss": 0.2693,
"step": 37725
},
{
"epoch": 1.51,
"learning_rate": 9.254574574574574e-06,
"loss": 0.2509,
"step": 37750
},
{
"epoch": 1.51,
"learning_rate": 9.254074074074075e-06,
"loss": 0.2698,
"step": 37775
},
{
"epoch": 1.51,
"learning_rate": 9.253573573573575e-06,
"loss": 0.2359,
"step": 37800
},
{
"epoch": 1.51,
"learning_rate": 9.253073073073074e-06,
"loss": 0.2707,
"step": 37825
},
{
"epoch": 1.51,
"learning_rate": 9.252572572572573e-06,
"loss": 0.2534,
"step": 37850
},
{
"epoch": 1.51,
"learning_rate": 9.252072072072073e-06,
"loss": 0.2554,
"step": 37875
},
{
"epoch": 1.51,
"learning_rate": 9.251571571571572e-06,
"loss": 0.2753,
"step": 37900
},
{
"epoch": 1.51,
"learning_rate": 9.251071071071071e-06,
"loss": 0.2551,
"step": 37925
},
{
"epoch": 1.51,
"learning_rate": 9.250570570570572e-06,
"loss": 0.2576,
"step": 37950
},
{
"epoch": 1.51,
"learning_rate": 9.250070070070071e-06,
"loss": 0.2579,
"step": 37975
},
{
"epoch": 1.52,
"learning_rate": 9.24956956956957e-06,
"loss": 0.2661,
"step": 38000
},
{
"epoch": 1.52,
"eval_loss": 0.4426652491092682,
"eval_runtime": 2522.4342,
"eval_samples_per_second": 6.428,
"eval_steps_per_second": 0.161,
"eval_wer": 25.423023257606708,
"step": 38000
},
{
"epoch": 1.52,
"learning_rate": 9.24906906906907e-06,
"loss": 0.2819,
"step": 38025
},
{
"epoch": 1.52,
"learning_rate": 9.24856856856857e-06,
"loss": 0.2773,
"step": 38050
},
{
"epoch": 1.52,
"learning_rate": 9.248068068068069e-06,
"loss": 0.2604,
"step": 38075
},
{
"epoch": 1.52,
"learning_rate": 9.247567567567568e-06,
"loss": 0.2645,
"step": 38100
},
{
"epoch": 1.52,
"learning_rate": 9.247067067067069e-06,
"loss": 0.2504,
"step": 38125
},
{
"epoch": 1.52,
"learning_rate": 9.246566566566567e-06,
"loss": 0.2731,
"step": 38150
},
{
"epoch": 1.52,
"learning_rate": 9.246066066066068e-06,
"loss": 0.2543,
"step": 38175
},
{
"epoch": 1.52,
"learning_rate": 9.245565565565567e-06,
"loss": 0.2552,
"step": 38200
},
{
"epoch": 1.52,
"learning_rate": 9.245065065065066e-06,
"loss": 0.2789,
"step": 38225
},
{
"epoch": 1.53,
"learning_rate": 9.244564564564565e-06,
"loss": 0.2668,
"step": 38250
},
{
"epoch": 1.53,
"learning_rate": 9.244064064064065e-06,
"loss": 0.2635,
"step": 38275
},
{
"epoch": 1.53,
"learning_rate": 9.243563563563564e-06,
"loss": 0.248,
"step": 38300
},
{
"epoch": 1.53,
"learning_rate": 9.243063063063063e-06,
"loss": 0.2675,
"step": 38325
},
{
"epoch": 1.53,
"learning_rate": 9.242562562562564e-06,
"loss": 0.265,
"step": 38350
},
{
"epoch": 1.53,
"learning_rate": 9.242062062062062e-06,
"loss": 0.2509,
"step": 38375
},
{
"epoch": 1.53,
"learning_rate": 9.241561561561563e-06,
"loss": 0.2535,
"step": 38400
},
{
"epoch": 1.53,
"learning_rate": 9.241061061061062e-06,
"loss": 0.2716,
"step": 38425
},
{
"epoch": 1.53,
"learning_rate": 9.240560560560561e-06,
"loss": 0.2578,
"step": 38450
},
{
"epoch": 1.53,
"learning_rate": 9.24006006006006e-06,
"loss": 0.2743,
"step": 38475
},
{
"epoch": 1.54,
"learning_rate": 9.23955955955956e-06,
"loss": 0.2701,
"step": 38500
},
{
"epoch": 1.54,
"learning_rate": 9.23905905905906e-06,
"loss": 0.2716,
"step": 38525
},
{
"epoch": 1.54,
"learning_rate": 9.238558558558559e-06,
"loss": 0.2696,
"step": 38550
},
{
"epoch": 1.54,
"learning_rate": 9.23805805805806e-06,
"loss": 0.2701,
"step": 38575
},
{
"epoch": 1.54,
"learning_rate": 9.237577577577577e-06,
"loss": 0.2573,
"step": 38600
},
{
"epoch": 1.54,
"learning_rate": 9.237077077077078e-06,
"loss": 0.2641,
"step": 38625
},
{
"epoch": 1.54,
"learning_rate": 9.236576576576577e-06,
"loss": 0.277,
"step": 38650
},
{
"epoch": 1.54,
"learning_rate": 9.236076076076077e-06,
"loss": 0.2562,
"step": 38675
},
{
"epoch": 1.54,
"learning_rate": 9.235575575575576e-06,
"loss": 0.2584,
"step": 38700
},
{
"epoch": 1.54,
"learning_rate": 9.235075075075077e-06,
"loss": 0.2571,
"step": 38725
},
{
"epoch": 1.55,
"learning_rate": 9.234574574574575e-06,
"loss": 0.2652,
"step": 38750
},
{
"epoch": 1.55,
"learning_rate": 9.234074074074076e-06,
"loss": 0.26,
"step": 38775
},
{
"epoch": 1.55,
"learning_rate": 9.233573573573575e-06,
"loss": 0.2475,
"step": 38800
},
{
"epoch": 1.55,
"learning_rate": 9.233073073073074e-06,
"loss": 0.2728,
"step": 38825
},
{
"epoch": 1.55,
"learning_rate": 9.232572572572573e-06,
"loss": 0.2678,
"step": 38850
},
{
"epoch": 1.55,
"learning_rate": 9.232072072072073e-06,
"loss": 0.2597,
"step": 38875
},
{
"epoch": 1.55,
"learning_rate": 9.231571571571572e-06,
"loss": 0.2532,
"step": 38900
},
{
"epoch": 1.55,
"learning_rate": 9.231071071071071e-06,
"loss": 0.2552,
"step": 38925
},
{
"epoch": 1.55,
"learning_rate": 9.230570570570572e-06,
"loss": 0.2528,
"step": 38950
},
{
"epoch": 1.55,
"learning_rate": 9.23007007007007e-06,
"loss": 0.2356,
"step": 38975
},
{
"epoch": 1.56,
"learning_rate": 9.229569569569571e-06,
"loss": 0.2512,
"step": 39000
},
{
"epoch": 1.56,
"eval_loss": 0.4447844326496124,
"eval_runtime": 2535.3087,
"eval_samples_per_second": 6.395,
"eval_steps_per_second": 0.16,
"eval_wer": 26.18311607218569,
"step": 39000
},
{
"epoch": 1.56,
"learning_rate": 9.22906906906907e-06,
"loss": 0.28,
"step": 39025
},
{
"epoch": 1.56,
"learning_rate": 9.22856856856857e-06,
"loss": 0.2598,
"step": 39050
},
{
"epoch": 1.56,
"learning_rate": 9.228068068068069e-06,
"loss": 0.2805,
"step": 39075
},
{
"epoch": 1.56,
"learning_rate": 9.227567567567568e-06,
"loss": 0.2677,
"step": 39100
},
{
"epoch": 1.56,
"learning_rate": 9.227067067067067e-06,
"loss": 0.2749,
"step": 39125
},
{
"epoch": 1.56,
"learning_rate": 9.226566566566567e-06,
"loss": 0.2652,
"step": 39150
},
{
"epoch": 1.56,
"learning_rate": 9.226066066066068e-06,
"loss": 0.2609,
"step": 39175
},
{
"epoch": 1.56,
"learning_rate": 9.225565565565567e-06,
"loss": 0.2656,
"step": 39200
},
{
"epoch": 1.56,
"learning_rate": 9.225065065065065e-06,
"loss": 0.2648,
"step": 39225
},
{
"epoch": 1.57,
"learning_rate": 9.224564564564566e-06,
"loss": 0.2567,
"step": 39250
},
{
"epoch": 1.57,
"learning_rate": 9.224064064064065e-06,
"loss": 0.2433,
"step": 39275
},
{
"epoch": 1.57,
"learning_rate": 9.223563563563564e-06,
"loss": 0.276,
"step": 39300
},
{
"epoch": 1.57,
"learning_rate": 9.223063063063064e-06,
"loss": 0.2651,
"step": 39325
},
{
"epoch": 1.57,
"learning_rate": 9.222562562562564e-06,
"loss": 0.2591,
"step": 39350
},
{
"epoch": 1.57,
"learning_rate": 9.222062062062062e-06,
"loss": 0.2616,
"step": 39375
},
{
"epoch": 1.57,
"learning_rate": 9.221561561561563e-06,
"loss": 0.2563,
"step": 39400
},
{
"epoch": 1.57,
"learning_rate": 9.221061061061062e-06,
"loss": 0.2595,
"step": 39425
},
{
"epoch": 1.57,
"learning_rate": 9.22056056056056e-06,
"loss": 0.2646,
"step": 39450
},
{
"epoch": 1.57,
"learning_rate": 9.220060060060061e-06,
"loss": 0.2676,
"step": 39475
},
{
"epoch": 1.58,
"learning_rate": 9.21955955955956e-06,
"loss": 0.2585,
"step": 39500
},
{
"epoch": 1.58,
"learning_rate": 9.21905905905906e-06,
"loss": 0.2599,
"step": 39525
},
{
"epoch": 1.58,
"learning_rate": 9.218558558558559e-06,
"loss": 0.2477,
"step": 39550
},
{
"epoch": 1.58,
"learning_rate": 9.21805805805806e-06,
"loss": 0.2376,
"step": 39575
},
{
"epoch": 1.58,
"learning_rate": 9.217557557557557e-06,
"loss": 0.2491,
"step": 39600
},
{
"epoch": 1.58,
"learning_rate": 9.217057057057058e-06,
"loss": 0.2533,
"step": 39625
},
{
"epoch": 1.58,
"learning_rate": 9.216556556556558e-06,
"loss": 0.2646,
"step": 39650
},
{
"epoch": 1.58,
"learning_rate": 9.216056056056057e-06,
"loss": 0.2824,
"step": 39675
},
{
"epoch": 1.58,
"learning_rate": 9.215555555555556e-06,
"loss": 0.2854,
"step": 39700
},
{
"epoch": 1.58,
"learning_rate": 9.215055055055056e-06,
"loss": 0.2553,
"step": 39725
},
{
"epoch": 1.59,
"learning_rate": 9.214554554554555e-06,
"loss": 0.2484,
"step": 39750
},
{
"epoch": 1.59,
"learning_rate": 9.214054054054054e-06,
"loss": 0.2362,
"step": 39775
},
{
"epoch": 1.59,
"learning_rate": 9.213553553553555e-06,
"loss": 0.2634,
"step": 39800
},
{
"epoch": 1.59,
"learning_rate": 9.213053053053055e-06,
"loss": 0.2554,
"step": 39825
},
{
"epoch": 1.59,
"learning_rate": 9.212552552552552e-06,
"loss": 0.2502,
"step": 39850
},
{
"epoch": 1.59,
"learning_rate": 9.212052052052053e-06,
"loss": 0.2546,
"step": 39875
},
{
"epoch": 1.59,
"learning_rate": 9.211551551551552e-06,
"loss": 0.2723,
"step": 39900
},
{
"epoch": 1.59,
"learning_rate": 9.211051051051052e-06,
"loss": 0.2674,
"step": 39925
},
{
"epoch": 1.59,
"learning_rate": 9.210550550550551e-06,
"loss": 0.2688,
"step": 39950
},
{
"epoch": 1.59,
"learning_rate": 9.21005005005005e-06,
"loss": 0.2512,
"step": 39975
},
{
"epoch": 1.6,
"learning_rate": 9.20954954954955e-06,
"loss": 0.2541,
"step": 40000
},
{
"epoch": 1.6,
"eval_loss": 0.4458891749382019,
"eval_runtime": 2617.6449,
"eval_samples_per_second": 6.194,
"eval_steps_per_second": 0.155,
"eval_wer": 26.314937442665414,
"step": 40000
},
{
"epoch": 1.6,
"learning_rate": 9.20904904904905e-06,
"loss": 0.2547,
"step": 40025
},
{
"epoch": 1.6,
"learning_rate": 9.20854854854855e-06,
"loss": 0.2557,
"step": 40050
},
{
"epoch": 1.6,
"learning_rate": 9.208048048048048e-06,
"loss": 0.2526,
"step": 40075
},
{
"epoch": 1.6,
"learning_rate": 9.207547547547549e-06,
"loss": 0.2709,
"step": 40100
},
{
"epoch": 1.6,
"learning_rate": 9.207047047047048e-06,
"loss": 0.2643,
"step": 40125
},
{
"epoch": 1.6,
"learning_rate": 9.206546546546547e-06,
"loss": 0.2716,
"step": 40150
},
{
"epoch": 1.6,
"learning_rate": 9.206046046046046e-06,
"loss": 0.2725,
"step": 40175
},
{
"epoch": 1.6,
"learning_rate": 9.205545545545547e-06,
"loss": 0.2532,
"step": 40200
},
{
"epoch": 1.6,
"learning_rate": 9.205045045045045e-06,
"loss": 0.2595,
"step": 40225
},
{
"epoch": 1.61,
"learning_rate": 9.204544544544546e-06,
"loss": 0.2619,
"step": 40250
},
{
"epoch": 1.61,
"learning_rate": 9.204044044044045e-06,
"loss": 0.2627,
"step": 40275
},
{
"epoch": 1.61,
"learning_rate": 9.203543543543545e-06,
"loss": 0.2581,
"step": 40300
},
{
"epoch": 1.61,
"learning_rate": 9.203043043043044e-06,
"loss": 0.2634,
"step": 40325
},
{
"epoch": 1.61,
"learning_rate": 9.202542542542543e-06,
"loss": 0.2392,
"step": 40350
},
{
"epoch": 1.61,
"learning_rate": 9.202042042042042e-06,
"loss": 0.2694,
"step": 40375
},
{
"epoch": 1.61,
"learning_rate": 9.201541541541542e-06,
"loss": 0.2596,
"step": 40400
},
{
"epoch": 1.61,
"learning_rate": 9.201041041041043e-06,
"loss": 0.2844,
"step": 40425
},
{
"epoch": 1.61,
"learning_rate": 9.200540540540542e-06,
"loss": 0.2679,
"step": 40450
},
{
"epoch": 1.61,
"learning_rate": 9.20004004004004e-06,
"loss": 0.2592,
"step": 40475
},
{
"epoch": 1.62,
"learning_rate": 9.19953953953954e-06,
"loss": 0.2523,
"step": 40500
},
{
"epoch": 1.62,
"learning_rate": 9.19903903903904e-06,
"loss": 0.27,
"step": 40525
},
{
"epoch": 1.62,
"learning_rate": 9.19853853853854e-06,
"loss": 0.272,
"step": 40550
},
{
"epoch": 1.62,
"learning_rate": 9.198038038038039e-06,
"loss": 0.2621,
"step": 40575
},
{
"epoch": 1.62,
"learning_rate": 9.197537537537538e-06,
"loss": 0.262,
"step": 40600
},
{
"epoch": 1.62,
"learning_rate": 9.197057057057059e-06,
"loss": 0.2642,
"step": 40625
},
{
"epoch": 1.62,
"learning_rate": 9.196556556556558e-06,
"loss": 0.278,
"step": 40650
},
{
"epoch": 1.62,
"learning_rate": 9.196056056056056e-06,
"loss": 0.2711,
"step": 40675
},
{
"epoch": 1.62,
"learning_rate": 9.195555555555557e-06,
"loss": 0.2728,
"step": 40700
},
{
"epoch": 1.62,
"learning_rate": 9.195055055055056e-06,
"loss": 0.2844,
"step": 40725
},
{
"epoch": 1.63,
"learning_rate": 9.194554554554555e-06,
"loss": 0.2657,
"step": 40750
},
{
"epoch": 1.63,
"learning_rate": 9.194054054054054e-06,
"loss": 0.2559,
"step": 40775
},
{
"epoch": 1.63,
"learning_rate": 9.193553553553555e-06,
"loss": 0.2671,
"step": 40800
},
{
"epoch": 1.63,
"learning_rate": 9.193053053053053e-06,
"loss": 0.2559,
"step": 40825
},
{
"epoch": 1.63,
"learning_rate": 9.192552552552554e-06,
"loss": 0.2546,
"step": 40850
},
{
"epoch": 1.63,
"learning_rate": 9.192052052052053e-06,
"loss": 0.2607,
"step": 40875
},
{
"epoch": 1.63,
"learning_rate": 9.191551551551553e-06,
"loss": 0.2718,
"step": 40900
},
{
"epoch": 1.63,
"learning_rate": 9.191051051051052e-06,
"loss": 0.2672,
"step": 40925
},
{
"epoch": 1.63,
"learning_rate": 9.190550550550551e-06,
"loss": 0.2682,
"step": 40950
},
{
"epoch": 1.63,
"learning_rate": 9.19005005005005e-06,
"loss": 0.2646,
"step": 40975
},
{
"epoch": 1.64,
"learning_rate": 9.18954954954955e-06,
"loss": 0.2535,
"step": 41000
},
{
"epoch": 1.64,
"eval_loss": 0.44114458560943604,
"eval_runtime": 2473.7687,
"eval_samples_per_second": 6.554,
"eval_steps_per_second": 0.164,
"eval_wer": 25.31355755814402,
"step": 41000
},
{
"epoch": 1.64,
"learning_rate": 9.18904904904905e-06,
"loss": 0.2634,
"step": 41025
},
{
"epoch": 1.64,
"learning_rate": 9.18854854854855e-06,
"loss": 0.2616,
"step": 41050
},
{
"epoch": 1.64,
"learning_rate": 9.188048048048048e-06,
"loss": 0.266,
"step": 41075
},
{
"epoch": 1.64,
"learning_rate": 9.187547547547549e-06,
"loss": 0.264,
"step": 41100
},
{
"epoch": 1.64,
"learning_rate": 9.187047047047048e-06,
"loss": 0.2604,
"step": 41125
},
{
"epoch": 1.64,
"learning_rate": 9.186546546546547e-06,
"loss": 0.2552,
"step": 41150
},
{
"epoch": 1.64,
"learning_rate": 9.186046046046047e-06,
"loss": 0.2539,
"step": 41175
},
{
"epoch": 1.64,
"learning_rate": 9.185545545545546e-06,
"loss": 0.2854,
"step": 41200
},
{
"epoch": 1.64,
"learning_rate": 9.185045045045045e-06,
"loss": 0.2629,
"step": 41225
},
{
"epoch": 1.64,
"learning_rate": 9.184544544544546e-06,
"loss": 0.2613,
"step": 41250
},
{
"epoch": 1.65,
"learning_rate": 9.184044044044045e-06,
"loss": 0.2561,
"step": 41275
},
{
"epoch": 1.65,
"learning_rate": 9.183543543543543e-06,
"loss": 0.2617,
"step": 41300
},
{
"epoch": 1.65,
"learning_rate": 9.183043043043044e-06,
"loss": 0.2573,
"step": 41325
},
{
"epoch": 1.65,
"learning_rate": 9.182542542542543e-06,
"loss": 0.2622,
"step": 41350
},
{
"epoch": 1.65,
"learning_rate": 9.182042042042043e-06,
"loss": 0.2472,
"step": 41375
},
{
"epoch": 1.65,
"learning_rate": 9.181541541541542e-06,
"loss": 0.262,
"step": 41400
},
{
"epoch": 1.65,
"learning_rate": 9.181041041041043e-06,
"loss": 0.2558,
"step": 41425
},
{
"epoch": 1.65,
"learning_rate": 9.18054054054054e-06,
"loss": 0.2572,
"step": 41450
},
{
"epoch": 1.65,
"learning_rate": 9.180040040040042e-06,
"loss": 0.2618,
"step": 41475
},
{
"epoch": 1.65,
"learning_rate": 9.17953953953954e-06,
"loss": 0.2532,
"step": 41500
},
{
"epoch": 1.66,
"learning_rate": 9.17903903903904e-06,
"loss": 0.2522,
"step": 41525
},
{
"epoch": 1.66,
"learning_rate": 9.17853853853854e-06,
"loss": 0.275,
"step": 41550
},
{
"epoch": 1.66,
"learning_rate": 9.178038038038039e-06,
"loss": 0.2754,
"step": 41575
},
{
"epoch": 1.66,
"learning_rate": 9.177537537537538e-06,
"loss": 0.2599,
"step": 41600
},
{
"epoch": 1.66,
"learning_rate": 9.177037037037037e-06,
"loss": 0.2509,
"step": 41625
},
{
"epoch": 1.66,
"learning_rate": 9.176536536536538e-06,
"loss": 0.2554,
"step": 41650
},
{
"epoch": 1.66,
"learning_rate": 9.176036036036036e-06,
"loss": 0.2426,
"step": 41675
},
{
"epoch": 1.66,
"learning_rate": 9.175535535535535e-06,
"loss": 0.2675,
"step": 41700
},
{
"epoch": 1.66,
"learning_rate": 9.175035035035036e-06,
"loss": 0.2559,
"step": 41725
},
{
"epoch": 1.66,
"learning_rate": 9.174534534534536e-06,
"loss": 0.2716,
"step": 41750
},
{
"epoch": 1.67,
"learning_rate": 9.174034034034035e-06,
"loss": 0.2686,
"step": 41775
},
{
"epoch": 1.67,
"learning_rate": 9.173533533533534e-06,
"loss": 0.259,
"step": 41800
},
{
"epoch": 1.67,
"learning_rate": 9.173033033033033e-06,
"loss": 0.2747,
"step": 41825
},
{
"epoch": 1.67,
"learning_rate": 9.172532532532533e-06,
"loss": 0.2507,
"step": 41850
},
{
"epoch": 1.67,
"learning_rate": 9.172032032032034e-06,
"loss": 0.2573,
"step": 41875
},
{
"epoch": 1.67,
"learning_rate": 9.171531531531533e-06,
"loss": 0.2542,
"step": 41900
},
{
"epoch": 1.67,
"learning_rate": 9.17103103103103e-06,
"loss": 0.2584,
"step": 41925
},
{
"epoch": 1.67,
"learning_rate": 9.170530530530532e-06,
"loss": 0.2459,
"step": 41950
},
{
"epoch": 1.67,
"learning_rate": 9.170030030030031e-06,
"loss": 0.2533,
"step": 41975
},
{
"epoch": 1.67,
"learning_rate": 9.16952952952953e-06,
"loss": 0.2518,
"step": 42000
},
{
"epoch": 1.67,
"eval_loss": 0.42200759053230286,
"eval_runtime": 2416.12,
"eval_samples_per_second": 6.71,
"eval_steps_per_second": 0.168,
"eval_wer": 24.71689240755159,
"step": 42000
},
{
"epoch": 1.68,
"learning_rate": 9.16902902902903e-06,
"loss": 0.2759,
"step": 42025
},
{
"epoch": 1.68,
"learning_rate": 9.16852852852853e-06,
"loss": 0.258,
"step": 42050
},
{
"epoch": 1.68,
"learning_rate": 9.168028028028028e-06,
"loss": 0.2424,
"step": 42075
},
{
"epoch": 1.68,
"learning_rate": 9.167527527527527e-06,
"loss": 0.258,
"step": 42100
},
{
"epoch": 1.68,
"learning_rate": 9.167027027027028e-06,
"loss": 0.274,
"step": 42125
},
{
"epoch": 1.68,
"learning_rate": 9.166526526526528e-06,
"loss": 0.2479,
"step": 42150
},
{
"epoch": 1.68,
"learning_rate": 9.166026026026027e-06,
"loss": 0.2697,
"step": 42175
},
{
"epoch": 1.68,
"learning_rate": 9.165525525525526e-06,
"loss": 0.2621,
"step": 42200
},
{
"epoch": 1.68,
"learning_rate": 9.165025025025026e-06,
"loss": 0.2645,
"step": 42225
},
{
"epoch": 1.68,
"learning_rate": 9.164524524524525e-06,
"loss": 0.2624,
"step": 42250
},
{
"epoch": 1.69,
"learning_rate": 9.164024024024026e-06,
"loss": 0.2592,
"step": 42275
},
{
"epoch": 1.69,
"learning_rate": 9.163523523523523e-06,
"loss": 0.255,
"step": 42300
},
{
"epoch": 1.69,
"learning_rate": 9.163023023023023e-06,
"loss": 0.262,
"step": 42325
},
{
"epoch": 1.69,
"learning_rate": 9.162522522522524e-06,
"loss": 0.2687,
"step": 42350
},
{
"epoch": 1.69,
"learning_rate": 9.162022022022023e-06,
"loss": 0.2566,
"step": 42375
},
{
"epoch": 1.69,
"learning_rate": 9.161521521521522e-06,
"loss": 0.2563,
"step": 42400
},
{
"epoch": 1.69,
"learning_rate": 9.161021021021022e-06,
"loss": 0.2559,
"step": 42425
},
{
"epoch": 1.69,
"learning_rate": 9.160520520520521e-06,
"loss": 0.2641,
"step": 42450
},
{
"epoch": 1.69,
"learning_rate": 9.16002002002002e-06,
"loss": 0.2729,
"step": 42475
},
{
"epoch": 1.69,
"learning_rate": 9.159519519519521e-06,
"loss": 0.2531,
"step": 42500
},
{
"epoch": 1.7,
"learning_rate": 9.15901901901902e-06,
"loss": 0.2819,
"step": 42525
},
{
"epoch": 1.7,
"learning_rate": 9.158518518518518e-06,
"loss": 0.2594,
"step": 42550
},
{
"epoch": 1.7,
"learning_rate": 9.158018018018019e-06,
"loss": 0.2649,
"step": 42575
},
{
"epoch": 1.7,
"learning_rate": 9.157517517517518e-06,
"loss": 0.2593,
"step": 42600
},
{
"epoch": 1.7,
"learning_rate": 9.157017017017018e-06,
"loss": 0.2636,
"step": 42625
},
{
"epoch": 1.7,
"learning_rate": 9.156536536536539e-06,
"loss": 0.2698,
"step": 42650
},
{
"epoch": 1.7,
"learning_rate": 9.156036036036036e-06,
"loss": 0.254,
"step": 42675
},
{
"epoch": 1.7,
"learning_rate": 9.155535535535535e-06,
"loss": 0.2356,
"step": 42700
},
{
"epoch": 1.7,
"learning_rate": 9.155035035035036e-06,
"loss": 0.2506,
"step": 42725
},
{
"epoch": 1.7,
"learning_rate": 9.154534534534536e-06,
"loss": 0.2669,
"step": 42750
},
{
"epoch": 1.71,
"learning_rate": 9.154034034034035e-06,
"loss": 0.2576,
"step": 42775
},
{
"epoch": 1.71,
"learning_rate": 9.153533533533534e-06,
"loss": 0.2536,
"step": 42800
},
{
"epoch": 1.71,
"learning_rate": 9.153033033033034e-06,
"loss": 0.2686,
"step": 42825
},
{
"epoch": 1.71,
"learning_rate": 9.152532532532533e-06,
"loss": 0.2511,
"step": 42850
},
{
"epoch": 1.71,
"learning_rate": 9.152032032032034e-06,
"loss": 0.2667,
"step": 42875
},
{
"epoch": 1.71,
"learning_rate": 9.151531531531531e-06,
"loss": 0.2593,
"step": 42900
},
{
"epoch": 1.71,
"learning_rate": 9.15103103103103e-06,
"loss": 0.2656,
"step": 42925
},
{
"epoch": 1.71,
"learning_rate": 9.150530530530532e-06,
"loss": 0.2574,
"step": 42950
},
{
"epoch": 1.71,
"learning_rate": 9.150030030030031e-06,
"loss": 0.2557,
"step": 42975
},
{
"epoch": 1.71,
"learning_rate": 9.14952952952953e-06,
"loss": 0.255,
"step": 43000
},
{
"epoch": 1.71,
"eval_loss": 0.43135425448417664,
"eval_runtime": 2587.1846,
"eval_samples_per_second": 6.267,
"eval_steps_per_second": 0.157,
"eval_wer": 25.259595593620155,
"step": 43000
},
{
"epoch": 1.72,
"learning_rate": 9.14902902902903e-06,
"loss": 0.2639,
"step": 43025
},
{
"epoch": 1.72,
"learning_rate": 9.148528528528529e-06,
"loss": 0.256,
"step": 43050
},
{
"epoch": 1.72,
"learning_rate": 9.148028028028028e-06,
"loss": 0.2588,
"step": 43075
},
{
"epoch": 1.72,
"learning_rate": 9.14752752752753e-06,
"loss": 0.2768,
"step": 43100
},
{
"epoch": 1.72,
"learning_rate": 9.147027027027029e-06,
"loss": 0.2557,
"step": 43125
},
{
"epoch": 1.72,
"learning_rate": 9.146526526526526e-06,
"loss": 0.2506,
"step": 43150
},
{
"epoch": 1.72,
"learning_rate": 9.146026026026027e-06,
"loss": 0.2495,
"step": 43175
},
{
"epoch": 1.72,
"learning_rate": 9.145525525525526e-06,
"loss": 0.2652,
"step": 43200
},
{
"epoch": 1.72,
"learning_rate": 9.145025025025026e-06,
"loss": 0.2525,
"step": 43225
},
{
"epoch": 1.72,
"learning_rate": 9.144524524524525e-06,
"loss": 0.2694,
"step": 43250
},
{
"epoch": 1.73,
"learning_rate": 9.144024024024026e-06,
"loss": 0.2489,
"step": 43275
},
{
"epoch": 1.73,
"learning_rate": 9.143523523523524e-06,
"loss": 0.2531,
"step": 43300
},
{
"epoch": 1.73,
"learning_rate": 9.143023023023023e-06,
"loss": 0.2549,
"step": 43325
},
{
"epoch": 1.73,
"learning_rate": 9.142522522522524e-06,
"loss": 0.2526,
"step": 43350
},
{
"epoch": 1.73,
"learning_rate": 9.142022022022023e-06,
"loss": 0.2604,
"step": 43375
},
{
"epoch": 1.73,
"learning_rate": 9.141521521521523e-06,
"loss": 0.2683,
"step": 43400
},
{
"epoch": 1.73,
"learning_rate": 9.141021021021022e-06,
"loss": 0.2659,
"step": 43425
},
{
"epoch": 1.73,
"learning_rate": 9.140520520520521e-06,
"loss": 0.2569,
"step": 43450
},
{
"epoch": 1.73,
"learning_rate": 9.14002002002002e-06,
"loss": 0.2556,
"step": 43475
},
{
"epoch": 1.73,
"learning_rate": 9.139519519519521e-06,
"loss": 0.2752,
"step": 43500
},
{
"epoch": 1.74,
"learning_rate": 9.139019019019019e-06,
"loss": 0.2562,
"step": 43525
},
{
"epoch": 1.74,
"learning_rate": 9.138518518518518e-06,
"loss": 0.2848,
"step": 43550
},
{
"epoch": 1.74,
"learning_rate": 9.13801801801802e-06,
"loss": 0.2598,
"step": 43575
},
{
"epoch": 1.74,
"learning_rate": 9.137517517517519e-06,
"loss": 0.2663,
"step": 43600
},
{
"epoch": 1.74,
"learning_rate": 9.137017017017018e-06,
"loss": 0.2582,
"step": 43625
},
{
"epoch": 1.74,
"learning_rate": 9.136516516516517e-06,
"loss": 0.2646,
"step": 43650
},
{
"epoch": 1.74,
"learning_rate": 9.136016016016016e-06,
"loss": 0.2623,
"step": 43675
},
{
"epoch": 1.74,
"learning_rate": 9.135515515515516e-06,
"loss": 0.2569,
"step": 43700
},
{
"epoch": 1.74,
"learning_rate": 9.135015015015017e-06,
"loss": 0.2504,
"step": 43725
},
{
"epoch": 1.74,
"learning_rate": 9.134514514514516e-06,
"loss": 0.2726,
"step": 43750
},
{
"epoch": 1.75,
"learning_rate": 9.134014014014014e-06,
"loss": 0.2593,
"step": 43775
},
{
"epoch": 1.75,
"learning_rate": 9.133513513513515e-06,
"loss": 0.2478,
"step": 43800
},
{
"epoch": 1.75,
"learning_rate": 9.133013013013014e-06,
"loss": 0.2582,
"step": 43825
},
{
"epoch": 1.75,
"learning_rate": 9.132512512512513e-06,
"loss": 0.2646,
"step": 43850
},
{
"epoch": 1.75,
"learning_rate": 9.132012012012013e-06,
"loss": 0.2822,
"step": 43875
},
{
"epoch": 1.75,
"learning_rate": 9.131511511511514e-06,
"loss": 0.2379,
"step": 43900
},
{
"epoch": 1.75,
"learning_rate": 9.131011011011011e-06,
"loss": 0.2728,
"step": 43925
},
{
"epoch": 1.75,
"learning_rate": 9.13051051051051e-06,
"loss": 0.274,
"step": 43950
},
{
"epoch": 1.75,
"learning_rate": 9.130010010010011e-06,
"loss": 0.2838,
"step": 43975
},
{
"epoch": 1.75,
"learning_rate": 9.129509509509509e-06,
"loss": 0.2639,
"step": 44000
},
{
"epoch": 1.75,
"eval_loss": 0.43265146017074585,
"eval_runtime": 2614.8693,
"eval_samples_per_second": 6.2,
"eval_steps_per_second": 0.155,
"eval_wer": 25.521696564164632,
"step": 44000
},
{
"epoch": 1.76,
"learning_rate": 9.12900900900901e-06,
"loss": 0.2588,
"step": 44025
},
{
"epoch": 1.76,
"learning_rate": 9.12850850850851e-06,
"loss": 0.2764,
"step": 44050
},
{
"epoch": 1.76,
"learning_rate": 9.128008008008009e-06,
"loss": 0.263,
"step": 44075
},
{
"epoch": 1.76,
"learning_rate": 9.127507507507508e-06,
"loss": 0.2644,
"step": 44100
},
{
"epoch": 1.76,
"learning_rate": 9.127007007007009e-06,
"loss": 0.2476,
"step": 44125
},
{
"epoch": 1.76,
"learning_rate": 9.126506506506507e-06,
"loss": 0.2604,
"step": 44150
},
{
"epoch": 1.76,
"learning_rate": 9.126006006006006e-06,
"loss": 0.2747,
"step": 44175
},
{
"epoch": 1.76,
"learning_rate": 9.125505505505507e-06,
"loss": 0.265,
"step": 44200
},
{
"epoch": 1.76,
"learning_rate": 9.125005005005006e-06,
"loss": 0.2568,
"step": 44225
},
{
"epoch": 1.76,
"learning_rate": 9.124504504504505e-06,
"loss": 0.2485,
"step": 44250
},
{
"epoch": 1.77,
"learning_rate": 9.124004004004005e-06,
"loss": 0.2742,
"step": 44275
},
{
"epoch": 1.77,
"learning_rate": 9.123503503503504e-06,
"loss": 0.2634,
"step": 44300
},
{
"epoch": 1.77,
"learning_rate": 9.123003003003003e-06,
"loss": 0.2805,
"step": 44325
},
{
"epoch": 1.77,
"learning_rate": 9.122502502502504e-06,
"loss": 0.2543,
"step": 44350
},
{
"epoch": 1.77,
"learning_rate": 9.122002002002004e-06,
"loss": 0.2753,
"step": 44375
},
{
"epoch": 1.77,
"learning_rate": 9.121501501501501e-06,
"loss": 0.2607,
"step": 44400
},
{
"epoch": 1.77,
"learning_rate": 9.121001001001002e-06,
"loss": 0.242,
"step": 44425
},
{
"epoch": 1.77,
"learning_rate": 9.120500500500501e-06,
"loss": 0.2633,
"step": 44450
},
{
"epoch": 1.77,
"learning_rate": 9.12e-06,
"loss": 0.2686,
"step": 44475
},
{
"epoch": 1.77,
"learning_rate": 9.1194994994995e-06,
"loss": 0.2608,
"step": 44500
},
{
"epoch": 1.78,
"learning_rate": 9.118998998999e-06,
"loss": 0.2779,
"step": 44525
},
{
"epoch": 1.78,
"learning_rate": 9.118498498498499e-06,
"loss": 0.2648,
"step": 44550
},
{
"epoch": 1.78,
"learning_rate": 9.117997997997998e-06,
"loss": 0.2701,
"step": 44575
},
{
"epoch": 1.78,
"learning_rate": 9.117497497497499e-06,
"loss": 0.245,
"step": 44600
},
{
"epoch": 1.78,
"learning_rate": 9.116996996996997e-06,
"loss": 0.2607,
"step": 44625
},
{
"epoch": 1.78,
"learning_rate": 9.116516516516517e-06,
"loss": 0.2622,
"step": 44650
},
{
"epoch": 1.78,
"learning_rate": 9.116016016016017e-06,
"loss": 0.2466,
"step": 44675
},
{
"epoch": 1.78,
"learning_rate": 9.115515515515516e-06,
"loss": 0.2627,
"step": 44700
},
{
"epoch": 1.78,
"learning_rate": 9.115015015015017e-06,
"loss": 0.26,
"step": 44725
},
{
"epoch": 1.78,
"learning_rate": 9.114514514514515e-06,
"loss": 0.2837,
"step": 44750
},
{
"epoch": 1.79,
"learning_rate": 9.114014014014014e-06,
"loss": 0.2417,
"step": 44775
},
{
"epoch": 1.79,
"learning_rate": 9.113513513513515e-06,
"loss": 0.2663,
"step": 44800
},
{
"epoch": 1.79,
"learning_rate": 9.113013013013014e-06,
"loss": 0.2606,
"step": 44825
},
{
"epoch": 1.79,
"learning_rate": 9.112512512512513e-06,
"loss": 0.2416,
"step": 44850
},
{
"epoch": 1.79,
"learning_rate": 9.112012012012013e-06,
"loss": 0.2537,
"step": 44875
},
{
"epoch": 1.79,
"learning_rate": 9.111511511511512e-06,
"loss": 0.2587,
"step": 44900
},
{
"epoch": 1.79,
"learning_rate": 9.111011011011011e-06,
"loss": 0.2658,
"step": 44925
},
{
"epoch": 1.79,
"learning_rate": 9.11051051051051e-06,
"loss": 0.2653,
"step": 44950
},
{
"epoch": 1.79,
"learning_rate": 9.110010010010012e-06,
"loss": 0.2643,
"step": 44975
},
{
"epoch": 1.79,
"learning_rate": 9.10950950950951e-06,
"loss": 0.2638,
"step": 45000
},
{
"epoch": 1.79,
"eval_loss": 0.432108074426651,
"eval_runtime": 2486.7031,
"eval_samples_per_second": 6.52,
"eval_steps_per_second": 0.163,
"eval_wer": 24.733851882116234,
"step": 45000
},
{
"epoch": 1.8,
"learning_rate": 9.10900900900901e-06,
"loss": 0.268,
"step": 45025
},
{
"epoch": 1.8,
"learning_rate": 9.10850850850851e-06,
"loss": 0.2566,
"step": 45050
},
{
"epoch": 1.8,
"learning_rate": 9.108008008008009e-06,
"loss": 0.2603,
"step": 45075
},
{
"epoch": 1.8,
"learning_rate": 9.107507507507508e-06,
"loss": 0.2463,
"step": 45100
},
{
"epoch": 1.8,
"learning_rate": 9.107007007007007e-06,
"loss": 0.2597,
"step": 45125
},
{
"epoch": 1.8,
"learning_rate": 9.106506506506507e-06,
"loss": 0.2531,
"step": 45150
},
{
"epoch": 1.8,
"learning_rate": 9.106006006006006e-06,
"loss": 0.2675,
"step": 45175
},
{
"epoch": 1.8,
"learning_rate": 9.105505505505507e-06,
"loss": 0.2445,
"step": 45200
},
{
"epoch": 1.8,
"learning_rate": 9.105005005005005e-06,
"loss": 0.2576,
"step": 45225
},
{
"epoch": 1.8,
"learning_rate": 9.104504504504506e-06,
"loss": 0.2473,
"step": 45250
},
{
"epoch": 1.81,
"learning_rate": 9.104004004004005e-06,
"loss": 0.2551,
"step": 45275
},
{
"epoch": 1.81,
"learning_rate": 9.103503503503504e-06,
"loss": 0.2658,
"step": 45300
},
{
"epoch": 1.81,
"learning_rate": 9.103003003003003e-06,
"loss": 0.2603,
"step": 45325
},
{
"epoch": 1.81,
"learning_rate": 9.102502502502504e-06,
"loss": 0.2618,
"step": 45350
},
{
"epoch": 1.81,
"learning_rate": 9.102002002002002e-06,
"loss": 0.2405,
"step": 45375
},
{
"epoch": 1.81,
"learning_rate": 9.101501501501501e-06,
"loss": 0.263,
"step": 45400
},
{
"epoch": 1.81,
"learning_rate": 9.101001001001002e-06,
"loss": 0.2673,
"step": 45425
},
{
"epoch": 1.81,
"learning_rate": 9.100500500500502e-06,
"loss": 0.2638,
"step": 45450
},
{
"epoch": 1.81,
"learning_rate": 9.100000000000001e-06,
"loss": 0.2583,
"step": 45475
},
{
"epoch": 1.81,
"learning_rate": 9.0994994994995e-06,
"loss": 0.2695,
"step": 45500
},
{
"epoch": 1.82,
"learning_rate": 9.098998998999e-06,
"loss": 0.2544,
"step": 45525
},
{
"epoch": 1.82,
"learning_rate": 9.098498498498499e-06,
"loss": 0.2634,
"step": 45550
},
{
"epoch": 1.82,
"learning_rate": 9.097997997997998e-06,
"loss": 0.2532,
"step": 45575
},
{
"epoch": 1.82,
"learning_rate": 9.097497497497499e-06,
"loss": 0.2559,
"step": 45600
},
{
"epoch": 1.82,
"learning_rate": 9.096996996996997e-06,
"loss": 0.2459,
"step": 45625
},
{
"epoch": 1.82,
"learning_rate": 9.096496496496498e-06,
"loss": 0.2781,
"step": 45650
},
{
"epoch": 1.82,
"learning_rate": 9.095995995995997e-06,
"loss": 0.2712,
"step": 45675
},
{
"epoch": 1.82,
"learning_rate": 9.095495495495496e-06,
"loss": 0.2597,
"step": 45700
},
{
"epoch": 1.82,
"learning_rate": 9.094994994994996e-06,
"loss": 0.275,
"step": 45725
},
{
"epoch": 1.82,
"learning_rate": 9.094494494494495e-06,
"loss": 0.2458,
"step": 45750
},
{
"epoch": 1.83,
"learning_rate": 9.093993993993994e-06,
"loss": 0.2752,
"step": 45775
},
{
"epoch": 1.83,
"learning_rate": 9.093493493493494e-06,
"loss": 0.261,
"step": 45800
},
{
"epoch": 1.83,
"learning_rate": 9.092992992992995e-06,
"loss": 0.2532,
"step": 45825
},
{
"epoch": 1.83,
"learning_rate": 9.092492492492492e-06,
"loss": 0.2847,
"step": 45850
},
{
"epoch": 1.83,
"learning_rate": 9.091991991991993e-06,
"loss": 0.2607,
"step": 45875
},
{
"epoch": 1.83,
"learning_rate": 9.091491491491492e-06,
"loss": 0.2678,
"step": 45900
},
{
"epoch": 1.83,
"learning_rate": 9.090990990990992e-06,
"loss": 0.2488,
"step": 45925
},
{
"epoch": 1.83,
"learning_rate": 9.090490490490491e-06,
"loss": 0.2628,
"step": 45950
},
{
"epoch": 1.83,
"learning_rate": 9.089989989989992e-06,
"loss": 0.2625,
"step": 45975
},
{
"epoch": 1.83,
"learning_rate": 9.08948948948949e-06,
"loss": 0.2647,
"step": 46000
},
{
"epoch": 1.83,
"eval_loss": 0.44105586409568787,
"eval_runtime": 2496.4644,
"eval_samples_per_second": 6.494,
"eval_steps_per_second": 0.163,
"eval_wer": 24.86027705614357,
"step": 46000
}
],
"max_steps": 500000,
"num_train_epochs": 20,
"total_flos": 5.309913924895223e+20,
"trial_name": null,
"trial_params": null
}