{ "best_metric": 27.969339566672204, "best_model_checkpoint": "./hamsa-tiny-pretrained/checkpoint-42500", "epoch": 2.004972331381827, "eval_steps": 2500, "global_step": 50000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 3.8e-07, "loss": 12.4564, "step": 25 }, { "epoch": 0.0, "learning_rate": 8.8e-07, "loss": 10.7741, "step": 50 }, { "epoch": 0.0, "learning_rate": 1.3800000000000001e-06, "loss": 6.9302, "step": 75 }, { "epoch": 0.0, "learning_rate": 1.8800000000000002e-06, "loss": 4.7429, "step": 100 }, { "epoch": 0.01, "learning_rate": 2.38e-06, "loss": 4.1009, "step": 125 }, { "epoch": 0.01, "learning_rate": 2.88e-06, "loss": 3.7125, "step": 150 }, { "epoch": 0.01, "learning_rate": 3.3800000000000007e-06, "loss": 3.5459, "step": 175 }, { "epoch": 0.01, "learning_rate": 3.88e-06, "loss": 3.4287, "step": 200 }, { "epoch": 0.01, "learning_rate": 4.38e-06, "loss": 3.3747, "step": 225 }, { "epoch": 0.01, "learning_rate": 4.880000000000001e-06, "loss": 3.3327, "step": 250 }, { "epoch": 0.01, "learning_rate": 5.380000000000001e-06, "loss": 3.2979, "step": 275 }, { "epoch": 0.01, "learning_rate": 5.8800000000000005e-06, "loss": 3.2587, "step": 300 }, { "epoch": 0.01, "learning_rate": 6.380000000000001e-06, "loss": 3.2244, "step": 325 }, { "epoch": 0.01, "learning_rate": 6.88e-06, "loss": 3.1921, "step": 350 }, { "epoch": 0.02, "learning_rate": 7.3800000000000005e-06, "loss": 3.174, "step": 375 }, { "epoch": 0.02, "learning_rate": 7.88e-06, "loss": 3.1549, "step": 400 }, { "epoch": 0.02, "learning_rate": 8.380000000000001e-06, "loss": 3.1301, "step": 425 }, { "epoch": 0.02, "learning_rate": 8.880000000000001e-06, "loss": 3.087, "step": 450 }, { "epoch": 0.02, "learning_rate": 9.38e-06, "loss": 3.0892, "step": 475 }, { "epoch": 0.02, "learning_rate": 9.88e-06, "loss": 3.0683, "step": 500 }, { "epoch": 0.02, "learning_rate": 9.996161616161618e-06, "loss": 3.0525, "step": 525 }, { "epoch": 0.02, "learning_rate": 9.991111111111112e-06, "loss": 3.0249, "step": 550 }, { "epoch": 0.02, "learning_rate": 9.986060606060606e-06, "loss": 3.0031, "step": 575 }, { "epoch": 0.02, "learning_rate": 9.981010101010102e-06, "loss": 2.9919, "step": 600 }, { "epoch": 0.03, "learning_rate": 9.975959595959597e-06, "loss": 2.9719, "step": 625 }, { "epoch": 0.03, "learning_rate": 9.970909090909093e-06, "loss": 2.9604, "step": 650 }, { "epoch": 0.03, "learning_rate": 9.965858585858587e-06, "loss": 2.9554, "step": 675 }, { "epoch": 0.03, "learning_rate": 9.960808080808081e-06, "loss": 2.92, "step": 700 }, { "epoch": 0.03, "learning_rate": 9.955757575757576e-06, "loss": 2.8839, "step": 725 }, { "epoch": 0.03, "learning_rate": 9.950707070707072e-06, "loss": 2.8838, "step": 750 }, { "epoch": 0.03, "learning_rate": 9.945656565656566e-06, "loss": 2.8339, "step": 775 }, { "epoch": 0.03, "learning_rate": 9.940606060606062e-06, "loss": 2.3913, "step": 800 }, { "epoch": 0.03, "learning_rate": 9.935555555555556e-06, "loss": 1.4371, "step": 825 }, { "epoch": 0.03, "learning_rate": 9.930505050505052e-06, "loss": 1.1851, "step": 850 }, { "epoch": 0.04, "learning_rate": 9.925454545454547e-06, "loss": 1.0894, "step": 875 }, { "epoch": 0.04, "learning_rate": 9.92040404040404e-06, "loss": 1.0265, "step": 900 }, { "epoch": 0.04, "learning_rate": 9.915353535353535e-06, "loss": 0.9688, "step": 925 }, { "epoch": 0.04, "learning_rate": 9.910303030303031e-06, "loss": 0.943, "step": 950 }, { "epoch": 0.04, "learning_rate": 9.905252525252525e-06, "loss": 0.9323, "step": 975 }, { "epoch": 0.04, "learning_rate": 9.900202020202021e-06, "loss": 0.9253, "step": 1000 }, { "epoch": 0.04, "learning_rate": 9.895151515151516e-06, "loss": 0.9364, "step": 1025 }, { "epoch": 0.04, "learning_rate": 9.890101010101012e-06, "loss": 0.877, "step": 1050 }, { "epoch": 0.04, "learning_rate": 9.885050505050506e-06, "loss": 0.8555, "step": 1075 }, { "epoch": 0.04, "learning_rate": 9.88e-06, "loss": 0.8677, "step": 1100 }, { "epoch": 0.05, "learning_rate": 9.874949494949496e-06, "loss": 0.8478, "step": 1125 }, { "epoch": 0.05, "learning_rate": 9.86989898989899e-06, "loss": 0.8226, "step": 1150 }, { "epoch": 0.05, "learning_rate": 9.864848484848487e-06, "loss": 0.8557, "step": 1175 }, { "epoch": 0.05, "learning_rate": 9.85979797979798e-06, "loss": 0.8147, "step": 1200 }, { "epoch": 0.05, "learning_rate": 9.854747474747475e-06, "loss": 0.8105, "step": 1225 }, { "epoch": 0.05, "learning_rate": 9.84969696969697e-06, "loss": 0.8112, "step": 1250 }, { "epoch": 0.05, "learning_rate": 9.844646464646465e-06, "loss": 0.8025, "step": 1275 }, { "epoch": 0.05, "learning_rate": 9.83959595959596e-06, "loss": 0.7667, "step": 1300 }, { "epoch": 0.05, "learning_rate": 9.834545454545456e-06, "loss": 0.7569, "step": 1325 }, { "epoch": 0.05, "learning_rate": 9.82949494949495e-06, "loss": 0.7895, "step": 1350 }, { "epoch": 0.06, "learning_rate": 9.824444444444446e-06, "loss": 0.7617, "step": 1375 }, { "epoch": 0.06, "learning_rate": 9.81939393939394e-06, "loss": 0.7461, "step": 1400 }, { "epoch": 0.06, "learning_rate": 9.814343434343435e-06, "loss": 0.7571, "step": 1425 }, { "epoch": 0.06, "learning_rate": 9.80929292929293e-06, "loss": 0.7505, "step": 1450 }, { "epoch": 0.06, "learning_rate": 9.804242424242425e-06, "loss": 0.7264, "step": 1475 }, { "epoch": 0.06, "learning_rate": 9.799191919191921e-06, "loss": 0.7555, "step": 1500 }, { "epoch": 0.06, "learning_rate": 9.794141414141415e-06, "loss": 0.7307, "step": 1525 }, { "epoch": 0.06, "learning_rate": 9.78909090909091e-06, "loss": 0.7414, "step": 1550 }, { "epoch": 0.06, "learning_rate": 9.784040404040405e-06, "loss": 0.7407, "step": 1575 }, { "epoch": 0.06, "learning_rate": 9.7789898989899e-06, "loss": 0.7128, "step": 1600 }, { "epoch": 0.07, "learning_rate": 9.773939393939394e-06, "loss": 0.7091, "step": 1625 }, { "epoch": 0.07, "learning_rate": 9.76888888888889e-06, "loss": 0.7166, "step": 1650 }, { "epoch": 0.07, "learning_rate": 9.763838383838384e-06, "loss": 0.7312, "step": 1675 }, { "epoch": 0.07, "learning_rate": 9.75878787878788e-06, "loss": 0.702, "step": 1700 }, { "epoch": 0.07, "learning_rate": 9.753737373737375e-06, "loss": 0.6995, "step": 1725 }, { "epoch": 0.07, "learning_rate": 9.748686868686869e-06, "loss": 0.7129, "step": 1750 }, { "epoch": 0.07, "learning_rate": 9.743636363636363e-06, "loss": 0.7034, "step": 1775 }, { "epoch": 0.07, "learning_rate": 9.73858585858586e-06, "loss": 0.7077, "step": 1800 }, { "epoch": 0.07, "learning_rate": 9.733535353535353e-06, "loss": 0.7103, "step": 1825 }, { "epoch": 0.07, "learning_rate": 9.72848484848485e-06, "loss": 0.6812, "step": 1850 }, { "epoch": 0.08, "learning_rate": 9.723434343434345e-06, "loss": 0.6833, "step": 1875 }, { "epoch": 0.08, "learning_rate": 9.71838383838384e-06, "loss": 0.7074, "step": 1900 }, { "epoch": 0.08, "learning_rate": 9.713333333333334e-06, "loss": 0.6759, "step": 1925 }, { "epoch": 0.08, "learning_rate": 9.708282828282828e-06, "loss": 0.6769, "step": 1950 }, { "epoch": 0.08, "learning_rate": 9.703232323232324e-06, "loss": 0.6499, "step": 1975 }, { "epoch": 0.08, "learning_rate": 9.698181818181819e-06, "loss": 0.671, "step": 2000 }, { "epoch": 0.08, "learning_rate": 9.693131313131315e-06, "loss": 0.6632, "step": 2025 }, { "epoch": 0.08, "learning_rate": 9.688080808080809e-06, "loss": 0.6818, "step": 2050 }, { "epoch": 0.08, "learning_rate": 9.683030303030305e-06, "loss": 0.655, "step": 2075 }, { "epoch": 0.08, "learning_rate": 9.6779797979798e-06, "loss": 0.6762, "step": 2100 }, { "epoch": 0.09, "learning_rate": 9.672929292929294e-06, "loss": 0.6799, "step": 2125 }, { "epoch": 0.09, "learning_rate": 9.667878787878788e-06, "loss": 0.6555, "step": 2150 }, { "epoch": 0.09, "learning_rate": 9.662828282828284e-06, "loss": 0.6549, "step": 2175 }, { "epoch": 0.09, "learning_rate": 9.657777777777778e-06, "loss": 0.665, "step": 2200 }, { "epoch": 0.09, "learning_rate": 9.652727272727274e-06, "loss": 0.6663, "step": 2225 }, { "epoch": 0.09, "learning_rate": 9.647676767676768e-06, "loss": 0.6383, "step": 2250 }, { "epoch": 0.09, "learning_rate": 9.642626262626263e-06, "loss": 0.6426, "step": 2275 }, { "epoch": 0.09, "learning_rate": 9.637575757575759e-06, "loss": 0.6448, "step": 2300 }, { "epoch": 0.09, "learning_rate": 9.632525252525253e-06, "loss": 0.6444, "step": 2325 }, { "epoch": 0.09, "learning_rate": 9.627474747474749e-06, "loss": 0.6468, "step": 2350 }, { "epoch": 0.1, "learning_rate": 9.622424242424243e-06, "loss": 0.659, "step": 2375 }, { "epoch": 0.1, "learning_rate": 9.61737373737374e-06, "loss": 0.6481, "step": 2400 }, { "epoch": 0.1, "learning_rate": 9.612323232323234e-06, "loss": 0.6516, "step": 2425 }, { "epoch": 0.1, "learning_rate": 9.607272727272728e-06, "loss": 0.6222, "step": 2450 }, { "epoch": 0.1, "learning_rate": 9.602222222222222e-06, "loss": 0.672, "step": 2475 }, { "epoch": 0.1, "learning_rate": 9.597171717171718e-06, "loss": 0.6597, "step": 2500 }, { "epoch": 0.1, "eval_loss": 0.6394317150115967, "eval_runtime": 334.7136, "eval_samples_per_second": 14.953, "eval_steps_per_second": 1.87, "eval_wer": 48.83836825743373, "step": 2500 }, { "epoch": 0.1, "learning_rate": 9.592121212121212e-06, "loss": 0.633, "step": 2525 }, { "epoch": 0.1, "learning_rate": 9.587070707070708e-06, "loss": 0.6082, "step": 2550 }, { "epoch": 0.1, "learning_rate": 9.582020202020203e-06, "loss": 0.6322, "step": 2575 }, { "epoch": 0.1, "learning_rate": 9.576969696969699e-06, "loss": 0.6516, "step": 2600 }, { "epoch": 0.11, "learning_rate": 9.571919191919193e-06, "loss": 0.637, "step": 2625 }, { "epoch": 0.11, "learning_rate": 9.566868686868687e-06, "loss": 0.6358, "step": 2650 }, { "epoch": 0.11, "learning_rate": 9.561818181818182e-06, "loss": 0.6416, "step": 2675 }, { "epoch": 0.11, "learning_rate": 9.556767676767678e-06, "loss": 0.6102, "step": 2700 }, { "epoch": 0.11, "learning_rate": 9.551717171717174e-06, "loss": 0.6196, "step": 2725 }, { "epoch": 0.11, "learning_rate": 9.546666666666668e-06, "loss": 0.6398, "step": 2750 }, { "epoch": 0.11, "learning_rate": 9.541616161616162e-06, "loss": 0.6186, "step": 2775 }, { "epoch": 0.11, "learning_rate": 9.536565656565656e-06, "loss": 0.618, "step": 2800 }, { "epoch": 0.11, "learning_rate": 9.531515151515152e-06, "loss": 0.622, "step": 2825 }, { "epoch": 0.11, "learning_rate": 9.526464646464647e-06, "loss": 0.6157, "step": 2850 }, { "epoch": 0.12, "learning_rate": 9.521414141414143e-06, "loss": 0.6351, "step": 2875 }, { "epoch": 0.12, "learning_rate": 9.516363636363637e-06, "loss": 0.6265, "step": 2900 }, { "epoch": 0.12, "learning_rate": 9.511313131313133e-06, "loss": 0.6202, "step": 2925 }, { "epoch": 0.12, "learning_rate": 9.506262626262627e-06, "loss": 0.5981, "step": 2950 }, { "epoch": 0.12, "learning_rate": 9.501212121212122e-06, "loss": 0.5991, "step": 2975 }, { "epoch": 0.12, "learning_rate": 9.496161616161616e-06, "loss": 0.5855, "step": 3000 }, { "epoch": 0.12, "learning_rate": 9.491111111111112e-06, "loss": 0.6107, "step": 3025 }, { "epoch": 0.12, "learning_rate": 9.486060606060606e-06, "loss": 0.5846, "step": 3050 }, { "epoch": 0.12, "learning_rate": 9.481010101010102e-06, "loss": 0.5985, "step": 3075 }, { "epoch": 0.12, "learning_rate": 9.475959595959596e-06, "loss": 0.6231, "step": 3100 }, { "epoch": 0.13, "learning_rate": 9.470909090909092e-06, "loss": 0.5999, "step": 3125 }, { "epoch": 0.13, "learning_rate": 9.465858585858587e-06, "loss": 0.5851, "step": 3150 }, { "epoch": 0.13, "learning_rate": 9.460808080808081e-06, "loss": 0.6101, "step": 3175 }, { "epoch": 0.13, "learning_rate": 9.455757575757577e-06, "loss": 0.6155, "step": 3200 }, { "epoch": 0.13, "learning_rate": 9.450707070707071e-06, "loss": 0.617, "step": 3225 }, { "epoch": 0.13, "learning_rate": 9.445656565656567e-06, "loss": 0.5908, "step": 3250 }, { "epoch": 0.13, "learning_rate": 9.440606060606062e-06, "loss": 0.5898, "step": 3275 }, { "epoch": 0.13, "learning_rate": 9.435555555555556e-06, "loss": 0.5761, "step": 3300 }, { "epoch": 0.13, "learning_rate": 9.43050505050505e-06, "loss": 0.6068, "step": 3325 }, { "epoch": 0.13, "learning_rate": 9.425454545454546e-06, "loss": 0.6193, "step": 3350 }, { "epoch": 0.14, "learning_rate": 9.42040404040404e-06, "loss": 0.5659, "step": 3375 }, { "epoch": 0.14, "learning_rate": 9.415353535353537e-06, "loss": 0.5706, "step": 3400 }, { "epoch": 0.14, "learning_rate": 9.41030303030303e-06, "loss": 0.5881, "step": 3425 }, { "epoch": 0.14, "learning_rate": 9.405252525252527e-06, "loss": 0.587, "step": 3450 }, { "epoch": 0.14, "learning_rate": 9.400202020202021e-06, "loss": 0.5999, "step": 3475 }, { "epoch": 0.14, "learning_rate": 9.395151515151515e-06, "loss": 0.5927, "step": 3500 }, { "epoch": 0.14, "learning_rate": 9.39010101010101e-06, "loss": 0.57, "step": 3525 }, { "epoch": 0.14, "learning_rate": 9.385050505050506e-06, "loss": 0.5748, "step": 3550 }, { "epoch": 0.14, "learning_rate": 9.38e-06, "loss": 0.5901, "step": 3575 }, { "epoch": 0.14, "learning_rate": 9.374949494949496e-06, "loss": 0.5614, "step": 3600 }, { "epoch": 0.15, "learning_rate": 9.369898989898992e-06, "loss": 0.5811, "step": 3625 }, { "epoch": 0.15, "learning_rate": 9.364848484848486e-06, "loss": 0.5777, "step": 3650 }, { "epoch": 0.15, "learning_rate": 9.35979797979798e-06, "loss": 0.595, "step": 3675 }, { "epoch": 0.15, "learning_rate": 9.354747474747475e-06, "loss": 0.5798, "step": 3700 }, { "epoch": 0.15, "learning_rate": 9.34969696969697e-06, "loss": 0.5856, "step": 3725 }, { "epoch": 0.15, "learning_rate": 9.344646464646465e-06, "loss": 0.5863, "step": 3750 }, { "epoch": 0.15, "learning_rate": 9.339595959595961e-06, "loss": 0.5817, "step": 3775 }, { "epoch": 0.15, "learning_rate": 9.334545454545455e-06, "loss": 0.5943, "step": 3800 }, { "epoch": 0.15, "learning_rate": 9.32949494949495e-06, "loss": 0.56, "step": 3825 }, { "epoch": 0.15, "learning_rate": 9.324444444444444e-06, "loss": 0.573, "step": 3850 }, { "epoch": 0.16, "learning_rate": 9.31939393939394e-06, "loss": 0.5525, "step": 3875 }, { "epoch": 0.16, "learning_rate": 9.314343434343434e-06, "loss": 0.6028, "step": 3900 }, { "epoch": 0.16, "learning_rate": 9.30929292929293e-06, "loss": 0.5804, "step": 3925 }, { "epoch": 0.16, "learning_rate": 9.304242424242425e-06, "loss": 0.5647, "step": 3950 }, { "epoch": 0.16, "learning_rate": 9.29919191919192e-06, "loss": 0.5758, "step": 3975 }, { "epoch": 0.16, "learning_rate": 9.294141414141415e-06, "loss": 0.5667, "step": 4000 }, { "epoch": 0.16, "learning_rate": 9.28909090909091e-06, "loss": 0.558, "step": 4025 }, { "epoch": 0.16, "learning_rate": 9.284040404040405e-06, "loss": 0.5671, "step": 4050 }, { "epoch": 0.16, "learning_rate": 9.2789898989899e-06, "loss": 0.5421, "step": 4075 }, { "epoch": 0.16, "learning_rate": 9.273939393939395e-06, "loss": 0.551, "step": 4100 }, { "epoch": 0.17, "learning_rate": 9.26888888888889e-06, "loss": 0.5646, "step": 4125 }, { "epoch": 0.17, "learning_rate": 9.263838383838386e-06, "loss": 0.5756, "step": 4150 }, { "epoch": 0.17, "learning_rate": 9.25878787878788e-06, "loss": 0.5527, "step": 4175 }, { "epoch": 0.17, "learning_rate": 9.253737373737374e-06, "loss": 0.5491, "step": 4200 }, { "epoch": 0.17, "learning_rate": 9.248686868686869e-06, "loss": 0.5713, "step": 4225 }, { "epoch": 0.17, "learning_rate": 9.243636363636365e-06, "loss": 0.5914, "step": 4250 }, { "epoch": 0.17, "learning_rate": 9.238585858585859e-06, "loss": 0.5546, "step": 4275 }, { "epoch": 0.17, "learning_rate": 9.233535353535355e-06, "loss": 0.5616, "step": 4300 }, { "epoch": 0.17, "learning_rate": 9.22848484848485e-06, "loss": 0.5532, "step": 4325 }, { "epoch": 0.17, "learning_rate": 9.223434343434343e-06, "loss": 0.5596, "step": 4350 }, { "epoch": 0.18, "learning_rate": 9.21838383838384e-06, "loss": 0.5584, "step": 4375 }, { "epoch": 0.18, "learning_rate": 9.213333333333334e-06, "loss": 0.5418, "step": 4400 }, { "epoch": 0.18, "learning_rate": 9.208282828282828e-06, "loss": 0.5438, "step": 4425 }, { "epoch": 0.18, "learning_rate": 9.203232323232324e-06, "loss": 0.5684, "step": 4450 }, { "epoch": 0.18, "learning_rate": 9.19818181818182e-06, "loss": 0.5224, "step": 4475 }, { "epoch": 0.18, "learning_rate": 9.193131313131314e-06, "loss": 0.5501, "step": 4500 }, { "epoch": 0.18, "learning_rate": 9.188080808080809e-06, "loss": 0.5429, "step": 4525 }, { "epoch": 0.18, "learning_rate": 9.183030303030303e-06, "loss": 0.5529, "step": 4550 }, { "epoch": 0.18, "learning_rate": 9.177979797979799e-06, "loss": 0.5694, "step": 4575 }, { "epoch": 0.18, "learning_rate": 9.172929292929293e-06, "loss": 0.5494, "step": 4600 }, { "epoch": 0.19, "learning_rate": 9.16787878787879e-06, "loss": 0.5686, "step": 4625 }, { "epoch": 0.19, "learning_rate": 9.162828282828284e-06, "loss": 0.5311, "step": 4650 }, { "epoch": 0.19, "learning_rate": 9.15777777777778e-06, "loss": 0.5439, "step": 4675 }, { "epoch": 0.19, "learning_rate": 9.152727272727274e-06, "loss": 0.5351, "step": 4700 }, { "epoch": 0.19, "learning_rate": 9.147676767676768e-06, "loss": 0.5438, "step": 4725 }, { "epoch": 0.19, "learning_rate": 9.142626262626262e-06, "loss": 0.5627, "step": 4750 }, { "epoch": 0.19, "learning_rate": 9.137575757575758e-06, "loss": 0.5443, "step": 4775 }, { "epoch": 0.19, "learning_rate": 9.132525252525253e-06, "loss": 0.5367, "step": 4800 }, { "epoch": 0.19, "learning_rate": 9.127474747474749e-06, "loss": 0.5256, "step": 4825 }, { "epoch": 0.19, "learning_rate": 9.122424242424243e-06, "loss": 0.5447, "step": 4850 }, { "epoch": 0.2, "learning_rate": 9.117373737373737e-06, "loss": 0.5295, "step": 4875 }, { "epoch": 0.2, "learning_rate": 9.112323232323233e-06, "loss": 0.5365, "step": 4900 }, { "epoch": 0.2, "learning_rate": 9.107272727272728e-06, "loss": 0.5309, "step": 4925 }, { "epoch": 0.2, "learning_rate": 9.102222222222224e-06, "loss": 0.5223, "step": 4950 }, { "epoch": 0.2, "learning_rate": 9.097171717171718e-06, "loss": 0.536, "step": 4975 }, { "epoch": 0.2, "learning_rate": 9.092121212121214e-06, "loss": 0.5442, "step": 5000 }, { "epoch": 0.2, "eval_loss": 0.5454992055892944, "eval_runtime": 329.8023, "eval_samples_per_second": 15.176, "eval_steps_per_second": 1.898, "eval_wer": 41.85433921070742, "step": 5000 }, { "epoch": 0.2, "learning_rate": 9.087070707070708e-06, "loss": 0.5432, "step": 5025 }, { "epoch": 0.2, "learning_rate": 9.082020202020202e-06, "loss": 0.5454, "step": 5050 }, { "epoch": 0.2, "learning_rate": 9.076969696969697e-06, "loss": 0.5455, "step": 5075 }, { "epoch": 0.2, "learning_rate": 9.071919191919193e-06, "loss": 0.5462, "step": 5100 }, { "epoch": 0.21, "learning_rate": 9.066868686868687e-06, "loss": 0.5283, "step": 5125 }, { "epoch": 0.21, "learning_rate": 9.061818181818183e-06, "loss": 0.5418, "step": 5150 }, { "epoch": 0.21, "learning_rate": 9.056767676767677e-06, "loss": 0.5293, "step": 5175 }, { "epoch": 0.21, "learning_rate": 9.051717171717173e-06, "loss": 0.5228, "step": 5200 }, { "epoch": 0.21, "learning_rate": 9.046666666666668e-06, "loss": 0.5381, "step": 5225 }, { "epoch": 0.21, "learning_rate": 9.041616161616162e-06, "loss": 0.5572, "step": 5250 }, { "epoch": 0.21, "learning_rate": 9.036565656565656e-06, "loss": 0.5243, "step": 5275 }, { "epoch": 0.21, "learning_rate": 9.031515151515152e-06, "loss": 0.5353, "step": 5300 }, { "epoch": 0.21, "learning_rate": 9.026464646464648e-06, "loss": 0.5348, "step": 5325 }, { "epoch": 0.21, "learning_rate": 9.021414141414142e-06, "loss": 0.5445, "step": 5350 }, { "epoch": 0.22, "learning_rate": 9.016363636363637e-06, "loss": 0.516, "step": 5375 }, { "epoch": 0.22, "learning_rate": 9.011313131313133e-06, "loss": 0.5268, "step": 5400 }, { "epoch": 0.22, "learning_rate": 9.006262626262627e-06, "loss": 0.5416, "step": 5425 }, { "epoch": 0.22, "learning_rate": 9.001212121212121e-06, "loss": 0.5564, "step": 5450 }, { "epoch": 0.22, "learning_rate": 8.996161616161617e-06, "loss": 0.5475, "step": 5475 }, { "epoch": 0.22, "learning_rate": 8.991111111111112e-06, "loss": 0.5441, "step": 5500 }, { "epoch": 0.22, "learning_rate": 8.986060606060608e-06, "loss": 0.5281, "step": 5525 }, { "epoch": 0.22, "learning_rate": 8.981010101010102e-06, "loss": 0.5289, "step": 5550 }, { "epoch": 0.22, "learning_rate": 8.975959595959596e-06, "loss": 0.5466, "step": 5575 }, { "epoch": 0.22, "learning_rate": 8.97090909090909e-06, "loss": 0.5344, "step": 5600 }, { "epoch": 0.23, "learning_rate": 8.965858585858586e-06, "loss": 0.51, "step": 5625 }, { "epoch": 0.23, "learning_rate": 8.96080808080808e-06, "loss": 0.498, "step": 5650 }, { "epoch": 0.23, "learning_rate": 8.955757575757577e-06, "loss": 0.5346, "step": 5675 }, { "epoch": 0.23, "learning_rate": 8.950707070707071e-06, "loss": 0.5269, "step": 5700 }, { "epoch": 0.23, "learning_rate": 8.945656565656567e-06, "loss": 0.5345, "step": 5725 }, { "epoch": 0.23, "learning_rate": 8.940606060606061e-06, "loss": 0.5265, "step": 5750 }, { "epoch": 0.23, "learning_rate": 8.935555555555556e-06, "loss": 0.5264, "step": 5775 }, { "epoch": 0.23, "learning_rate": 8.930505050505052e-06, "loss": 0.5177, "step": 5800 }, { "epoch": 0.23, "learning_rate": 8.925454545454546e-06, "loss": 0.533, "step": 5825 }, { "epoch": 0.23, "learning_rate": 8.920404040404042e-06, "loss": 0.5188, "step": 5850 }, { "epoch": 0.24, "learning_rate": 8.915353535353536e-06, "loss": 0.5245, "step": 5875 }, { "epoch": 0.24, "learning_rate": 8.91030303030303e-06, "loss": 0.5166, "step": 5900 }, { "epoch": 0.24, "learning_rate": 8.905252525252527e-06, "loss": 0.5323, "step": 5925 }, { "epoch": 0.24, "learning_rate": 8.90020202020202e-06, "loss": 0.5216, "step": 5950 }, { "epoch": 0.24, "learning_rate": 8.895151515151515e-06, "loss": 0.5037, "step": 5975 }, { "epoch": 0.24, "learning_rate": 8.890101010101011e-06, "loss": 0.5348, "step": 6000 }, { "epoch": 0.24, "learning_rate": 8.885050505050505e-06, "loss": 0.5265, "step": 6025 }, { "epoch": 0.24, "learning_rate": 8.880000000000001e-06, "loss": 0.5232, "step": 6050 }, { "epoch": 0.24, "learning_rate": 8.874949494949496e-06, "loss": 0.5024, "step": 6075 }, { "epoch": 0.24, "learning_rate": 8.86989898989899e-06, "loss": 0.5103, "step": 6100 }, { "epoch": 0.25, "learning_rate": 8.864848484848484e-06, "loss": 0.4969, "step": 6125 }, { "epoch": 0.25, "learning_rate": 8.85979797979798e-06, "loss": 0.5156, "step": 6150 }, { "epoch": 0.25, "learning_rate": 8.854747474747476e-06, "loss": 0.5261, "step": 6175 }, { "epoch": 0.25, "learning_rate": 8.84969696969697e-06, "loss": 0.5004, "step": 6200 }, { "epoch": 0.25, "learning_rate": 8.844646464646467e-06, "loss": 0.4955, "step": 6225 }, { "epoch": 0.25, "learning_rate": 8.83959595959596e-06, "loss": 0.5173, "step": 6250 }, { "epoch": 0.25, "learning_rate": 8.834545454545455e-06, "loss": 0.5217, "step": 6275 }, { "epoch": 0.25, "learning_rate": 8.82949494949495e-06, "loss": 0.512, "step": 6300 }, { "epoch": 0.25, "learning_rate": 8.824444444444445e-06, "loss": 0.506, "step": 6325 }, { "epoch": 0.25, "learning_rate": 8.81939393939394e-06, "loss": 0.5232, "step": 6350 }, { "epoch": 0.26, "learning_rate": 8.814343434343436e-06, "loss": 0.5187, "step": 6375 }, { "epoch": 0.26, "learning_rate": 8.80929292929293e-06, "loss": 0.4965, "step": 6400 }, { "epoch": 0.26, "learning_rate": 8.804242424242426e-06, "loss": 0.5071, "step": 6425 }, { "epoch": 0.26, "learning_rate": 8.79919191919192e-06, "loss": 0.5165, "step": 6450 }, { "epoch": 0.26, "learning_rate": 8.794141414141415e-06, "loss": 0.5104, "step": 6475 }, { "epoch": 0.26, "learning_rate": 8.789090909090909e-06, "loss": 0.4947, "step": 6500 }, { "epoch": 0.26, "learning_rate": 8.784040404040405e-06, "loss": 0.4864, "step": 6525 }, { "epoch": 0.26, "learning_rate": 8.7789898989899e-06, "loss": 0.5373, "step": 6550 }, { "epoch": 0.26, "learning_rate": 8.773939393939395e-06, "loss": 0.5253, "step": 6575 }, { "epoch": 0.26, "learning_rate": 8.76888888888889e-06, "loss": 0.5056, "step": 6600 }, { "epoch": 0.27, "learning_rate": 8.763838383838384e-06, "loss": 0.5065, "step": 6625 }, { "epoch": 0.27, "learning_rate": 8.75878787878788e-06, "loss": 0.5022, "step": 6650 }, { "epoch": 0.27, "learning_rate": 8.753737373737374e-06, "loss": 0.4991, "step": 6675 }, { "epoch": 0.27, "learning_rate": 8.74868686868687e-06, "loss": 0.5224, "step": 6700 }, { "epoch": 0.27, "learning_rate": 8.743636363636364e-06, "loss": 0.5293, "step": 6725 }, { "epoch": 0.27, "learning_rate": 8.73858585858586e-06, "loss": 0.5131, "step": 6750 }, { "epoch": 0.27, "learning_rate": 8.733535353535355e-06, "loss": 0.4972, "step": 6775 }, { "epoch": 0.27, "learning_rate": 8.728484848484849e-06, "loss": 0.4901, "step": 6800 }, { "epoch": 0.27, "learning_rate": 8.723434343434343e-06, "loss": 0.4907, "step": 6825 }, { "epoch": 0.27, "learning_rate": 8.71838383838384e-06, "loss": 0.4896, "step": 6850 }, { "epoch": 0.28, "learning_rate": 8.713333333333333e-06, "loss": 0.5052, "step": 6875 }, { "epoch": 0.28, "learning_rate": 8.70828282828283e-06, "loss": 0.5105, "step": 6900 }, { "epoch": 0.28, "learning_rate": 8.703232323232324e-06, "loss": 0.5036, "step": 6925 }, { "epoch": 0.28, "learning_rate": 8.69818181818182e-06, "loss": 0.4917, "step": 6950 }, { "epoch": 0.28, "learning_rate": 8.693131313131314e-06, "loss": 0.4844, "step": 6975 }, { "epoch": 0.28, "learning_rate": 8.688080808080808e-06, "loss": 0.5248, "step": 7000 }, { "epoch": 0.28, "learning_rate": 8.683030303030304e-06, "loss": 0.497, "step": 7025 }, { "epoch": 0.28, "learning_rate": 8.677979797979799e-06, "loss": 0.4918, "step": 7050 }, { "epoch": 0.28, "learning_rate": 8.672929292929295e-06, "loss": 0.5221, "step": 7075 }, { "epoch": 0.28, "learning_rate": 8.667878787878789e-06, "loss": 0.5155, "step": 7100 }, { "epoch": 0.29, "learning_rate": 8.662828282828283e-06, "loss": 0.5031, "step": 7125 }, { "epoch": 0.29, "learning_rate": 8.657777777777778e-06, "loss": 0.4829, "step": 7150 }, { "epoch": 0.29, "learning_rate": 8.652727272727274e-06, "loss": 0.4863, "step": 7175 }, { "epoch": 0.29, "learning_rate": 8.647676767676768e-06, "loss": 0.4697, "step": 7200 }, { "epoch": 0.29, "learning_rate": 8.642626262626264e-06, "loss": 0.4705, "step": 7225 }, { "epoch": 0.29, "learning_rate": 8.637575757575758e-06, "loss": 0.5049, "step": 7250 }, { "epoch": 0.29, "learning_rate": 8.632525252525254e-06, "loss": 0.5023, "step": 7275 }, { "epoch": 0.29, "learning_rate": 8.627474747474748e-06, "loss": 0.5118, "step": 7300 }, { "epoch": 0.29, "learning_rate": 8.622424242424243e-06, "loss": 0.5219, "step": 7325 }, { "epoch": 0.29, "learning_rate": 8.617373737373737e-06, "loss": 0.4733, "step": 7350 }, { "epoch": 0.3, "learning_rate": 8.612323232323233e-06, "loss": 0.4903, "step": 7375 }, { "epoch": 0.3, "learning_rate": 8.607272727272727e-06, "loss": 0.4855, "step": 7400 }, { "epoch": 0.3, "learning_rate": 8.602222222222223e-06, "loss": 0.4954, "step": 7425 }, { "epoch": 0.3, "learning_rate": 8.597171717171718e-06, "loss": 0.4778, "step": 7450 }, { "epoch": 0.3, "learning_rate": 8.592121212121214e-06, "loss": 0.5003, "step": 7475 }, { "epoch": 0.3, "learning_rate": 8.587070707070708e-06, "loss": 0.4954, "step": 7500 }, { "epoch": 0.3, "eval_loss": 0.5018385052680969, "eval_runtime": 326.6554, "eval_samples_per_second": 15.322, "eval_steps_per_second": 1.916, "eval_wer": 39.86093642468972, "step": 7500 }, { "epoch": 0.3, "learning_rate": 8.582020202020202e-06, "loss": 0.5221, "step": 7525 }, { "epoch": 0.3, "learning_rate": 8.576969696969698e-06, "loss": 0.4649, "step": 7550 }, { "epoch": 0.3, "learning_rate": 8.571919191919192e-06, "loss": 0.5203, "step": 7575 }, { "epoch": 0.3, "learning_rate": 8.566868686868688e-06, "loss": 0.4946, "step": 7600 }, { "epoch": 0.31, "learning_rate": 8.561818181818183e-06, "loss": 0.4797, "step": 7625 }, { "epoch": 0.31, "learning_rate": 8.556767676767677e-06, "loss": 0.5038, "step": 7650 }, { "epoch": 0.31, "learning_rate": 8.551717171717171e-06, "loss": 0.4835, "step": 7675 }, { "epoch": 0.31, "learning_rate": 8.546666666666667e-06, "loss": 0.5149, "step": 7700 }, { "epoch": 0.31, "learning_rate": 8.541616161616162e-06, "loss": 0.4866, "step": 7725 }, { "epoch": 0.31, "learning_rate": 8.536565656565658e-06, "loss": 0.4996, "step": 7750 }, { "epoch": 0.31, "learning_rate": 8.531515151515152e-06, "loss": 0.4758, "step": 7775 }, { "epoch": 0.31, "learning_rate": 8.526464646464648e-06, "loss": 0.5027, "step": 7800 }, { "epoch": 0.31, "learning_rate": 8.521414141414142e-06, "loss": 0.4976, "step": 7825 }, { "epoch": 0.31, "learning_rate": 8.516363636363636e-06, "loss": 0.4817, "step": 7850 }, { "epoch": 0.32, "learning_rate": 8.511313131313132e-06, "loss": 0.5112, "step": 7875 }, { "epoch": 0.32, "learning_rate": 8.506262626262627e-06, "loss": 0.476, "step": 7900 }, { "epoch": 0.32, "learning_rate": 8.501212121212123e-06, "loss": 0.4719, "step": 7925 }, { "epoch": 0.32, "learning_rate": 8.496161616161617e-06, "loss": 0.4911, "step": 7950 }, { "epoch": 0.32, "learning_rate": 8.491111111111113e-06, "loss": 0.503, "step": 7975 }, { "epoch": 0.32, "learning_rate": 8.486060606060607e-06, "loss": 0.4636, "step": 8000 }, { "epoch": 0.32, "learning_rate": 8.481010101010102e-06, "loss": 0.4923, "step": 8025 }, { "epoch": 0.32, "learning_rate": 8.475959595959596e-06, "loss": 0.4896, "step": 8050 }, { "epoch": 0.32, "learning_rate": 8.470909090909092e-06, "loss": 0.4901, "step": 8075 }, { "epoch": 0.32, "learning_rate": 8.465858585858586e-06, "loss": 0.4871, "step": 8100 }, { "epoch": 0.33, "learning_rate": 8.460808080808082e-06, "loss": 0.4808, "step": 8125 }, { "epoch": 0.33, "learning_rate": 8.455757575757576e-06, "loss": 0.4749, "step": 8150 }, { "epoch": 0.33, "learning_rate": 8.45070707070707e-06, "loss": 0.4905, "step": 8175 }, { "epoch": 0.33, "learning_rate": 8.445656565656565e-06, "loss": 0.4963, "step": 8200 }, { "epoch": 0.33, "learning_rate": 8.440606060606061e-06, "loss": 0.4755, "step": 8225 }, { "epoch": 0.33, "learning_rate": 8.435555555555555e-06, "loss": 0.5149, "step": 8250 }, { "epoch": 0.33, "learning_rate": 8.430505050505051e-06, "loss": 0.4944, "step": 8275 }, { "epoch": 0.33, "learning_rate": 8.425454545454547e-06, "loss": 0.4671, "step": 8300 }, { "epoch": 0.33, "learning_rate": 8.420404040404042e-06, "loss": 0.4706, "step": 8325 }, { "epoch": 0.33, "learning_rate": 8.415353535353536e-06, "loss": 0.4601, "step": 8350 }, { "epoch": 0.34, "learning_rate": 8.41030303030303e-06, "loss": 0.4612, "step": 8375 }, { "epoch": 0.34, "learning_rate": 8.405252525252526e-06, "loss": 0.4672, "step": 8400 }, { "epoch": 0.34, "learning_rate": 8.40020202020202e-06, "loss": 0.4875, "step": 8425 }, { "epoch": 0.34, "learning_rate": 8.395151515151516e-06, "loss": 0.5222, "step": 8450 }, { "epoch": 0.34, "learning_rate": 8.39010101010101e-06, "loss": 0.477, "step": 8475 }, { "epoch": 0.34, "learning_rate": 8.385050505050507e-06, "loss": 0.477, "step": 8500 }, { "epoch": 0.34, "learning_rate": 8.380000000000001e-06, "loss": 0.4654, "step": 8525 }, { "epoch": 0.34, "learning_rate": 8.374949494949495e-06, "loss": 0.4953, "step": 8550 }, { "epoch": 0.34, "learning_rate": 8.36989898989899e-06, "loss": 0.4741, "step": 8575 }, { "epoch": 0.34, "learning_rate": 8.364848484848486e-06, "loss": 0.5095, "step": 8600 }, { "epoch": 0.35, "learning_rate": 8.35979797979798e-06, "loss": 0.4731, "step": 8625 }, { "epoch": 0.35, "learning_rate": 8.354747474747476e-06, "loss": 0.4665, "step": 8650 }, { "epoch": 0.35, "learning_rate": 8.34969696969697e-06, "loss": 0.483, "step": 8675 }, { "epoch": 0.35, "learning_rate": 8.344646464646465e-06, "loss": 0.4905, "step": 8700 }, { "epoch": 0.35, "learning_rate": 8.33959595959596e-06, "loss": 0.4658, "step": 8725 }, { "epoch": 0.35, "learning_rate": 8.334545454545455e-06, "loss": 0.4826, "step": 8750 }, { "epoch": 0.35, "learning_rate": 8.32949494949495e-06, "loss": 0.478, "step": 8775 }, { "epoch": 0.35, "learning_rate": 8.324444444444445e-06, "loss": 0.4846, "step": 8800 }, { "epoch": 0.35, "learning_rate": 8.319393939393941e-06, "loss": 0.4757, "step": 8825 }, { "epoch": 0.35, "learning_rate": 8.314343434343435e-06, "loss": 0.4847, "step": 8850 }, { "epoch": 0.36, "learning_rate": 8.30929292929293e-06, "loss": 0.4886, "step": 8875 }, { "epoch": 0.36, "learning_rate": 8.304242424242424e-06, "loss": 0.4724, "step": 8900 }, { "epoch": 0.36, "learning_rate": 8.29919191919192e-06, "loss": 0.4785, "step": 8925 }, { "epoch": 0.36, "learning_rate": 8.294141414141414e-06, "loss": 0.4844, "step": 8950 }, { "epoch": 0.36, "learning_rate": 8.28909090909091e-06, "loss": 0.4694, "step": 8975 }, { "epoch": 0.36, "learning_rate": 8.284040404040405e-06, "loss": 0.4852, "step": 9000 }, { "epoch": 0.36, "learning_rate": 8.2789898989899e-06, "loss": 0.4963, "step": 9025 }, { "epoch": 0.36, "learning_rate": 8.273939393939395e-06, "loss": 0.4735, "step": 9050 }, { "epoch": 0.36, "learning_rate": 8.268888888888889e-06, "loss": 0.4733, "step": 9075 }, { "epoch": 0.36, "learning_rate": 8.263838383838383e-06, "loss": 0.4537, "step": 9100 }, { "epoch": 0.37, "learning_rate": 8.25878787878788e-06, "loss": 0.4843, "step": 9125 }, { "epoch": 0.37, "learning_rate": 8.253737373737375e-06, "loss": 0.4789, "step": 9150 }, { "epoch": 0.37, "learning_rate": 8.24868686868687e-06, "loss": 0.4908, "step": 9175 }, { "epoch": 0.37, "learning_rate": 8.243636363636364e-06, "loss": 0.4735, "step": 9200 }, { "epoch": 0.37, "learning_rate": 8.238585858585858e-06, "loss": 0.476, "step": 9225 }, { "epoch": 0.37, "learning_rate": 8.233535353535354e-06, "loss": 0.4844, "step": 9250 }, { "epoch": 0.37, "learning_rate": 8.228484848484849e-06, "loss": 0.4828, "step": 9275 }, { "epoch": 0.37, "learning_rate": 8.223434343434345e-06, "loss": 0.5066, "step": 9300 }, { "epoch": 0.37, "learning_rate": 8.218383838383839e-06, "loss": 0.4674, "step": 9325 }, { "epoch": 0.37, "learning_rate": 8.213333333333335e-06, "loss": 0.47, "step": 9350 }, { "epoch": 0.38, "learning_rate": 8.20828282828283e-06, "loss": 0.4821, "step": 9375 }, { "epoch": 0.38, "learning_rate": 8.203232323232323e-06, "loss": 0.4588, "step": 9400 }, { "epoch": 0.38, "learning_rate": 8.198181818181818e-06, "loss": 0.4674, "step": 9425 }, { "epoch": 0.38, "learning_rate": 8.193131313131314e-06, "loss": 0.4825, "step": 9450 }, { "epoch": 0.38, "learning_rate": 8.188080808080808e-06, "loss": 0.472, "step": 9475 }, { "epoch": 0.38, "learning_rate": 8.183030303030304e-06, "loss": 0.4723, "step": 9500 }, { "epoch": 0.38, "learning_rate": 8.177979797979798e-06, "loss": 0.4703, "step": 9525 }, { "epoch": 0.38, "learning_rate": 8.172929292929294e-06, "loss": 0.4945, "step": 9550 }, { "epoch": 0.38, "learning_rate": 8.167878787878789e-06, "loss": 0.4829, "step": 9575 }, { "epoch": 0.38, "learning_rate": 8.162828282828283e-06, "loss": 0.4595, "step": 9600 }, { "epoch": 0.39, "learning_rate": 8.157777777777779e-06, "loss": 0.4775, "step": 9625 }, { "epoch": 0.39, "learning_rate": 8.152727272727273e-06, "loss": 0.4583, "step": 9650 }, { "epoch": 0.39, "learning_rate": 8.14767676767677e-06, "loss": 0.4716, "step": 9675 }, { "epoch": 0.39, "learning_rate": 8.142626262626263e-06, "loss": 0.467, "step": 9700 }, { "epoch": 0.39, "learning_rate": 8.137575757575758e-06, "loss": 0.456, "step": 9725 }, { "epoch": 0.39, "learning_rate": 8.132525252525252e-06, "loss": 0.4694, "step": 9750 }, { "epoch": 0.39, "learning_rate": 8.127474747474748e-06, "loss": 0.4902, "step": 9775 }, { "epoch": 0.39, "learning_rate": 8.122424242424242e-06, "loss": 0.4852, "step": 9800 }, { "epoch": 0.39, "learning_rate": 8.117373737373738e-06, "loss": 0.4721, "step": 9825 }, { "epoch": 0.39, "learning_rate": 8.112323232323233e-06, "loss": 0.4712, "step": 9850 }, { "epoch": 0.4, "learning_rate": 8.107272727272729e-06, "loss": 0.4862, "step": 9875 }, { "epoch": 0.4, "learning_rate": 8.102222222222223e-06, "loss": 0.4626, "step": 9900 }, { "epoch": 0.4, "learning_rate": 8.097171717171717e-06, "loss": 0.4675, "step": 9925 }, { "epoch": 0.4, "learning_rate": 8.092121212121212e-06, "loss": 0.4686, "step": 9950 }, { "epoch": 0.4, "learning_rate": 8.087070707070708e-06, "loss": 0.455, "step": 9975 }, { "epoch": 0.4, "learning_rate": 8.082020202020204e-06, "loss": 0.474, "step": 10000 }, { "epoch": 0.4, "eval_loss": 0.4769977331161499, "eval_runtime": 328.2875, "eval_samples_per_second": 15.246, "eval_steps_per_second": 1.907, "eval_wer": 38.55335912100429, "step": 10000 }, { "epoch": 0.4, "learning_rate": 8.076969696969698e-06, "loss": 0.4679, "step": 10025 }, { "epoch": 0.4, "learning_rate": 8.071919191919194e-06, "loss": 0.4848, "step": 10050 }, { "epoch": 0.4, "learning_rate": 8.066868686868688e-06, "loss": 0.4654, "step": 10075 }, { "epoch": 0.41, "learning_rate": 8.061818181818182e-06, "loss": 0.4622, "step": 10100 }, { "epoch": 0.41, "learning_rate": 8.056767676767677e-06, "loss": 0.4658, "step": 10125 }, { "epoch": 0.41, "learning_rate": 8.051717171717173e-06, "loss": 0.4618, "step": 10150 }, { "epoch": 0.41, "learning_rate": 8.046666666666667e-06, "loss": 0.4523, "step": 10175 }, { "epoch": 0.41, "learning_rate": 8.041616161616163e-06, "loss": 0.4575, "step": 10200 }, { "epoch": 0.41, "learning_rate": 8.036565656565657e-06, "loss": 0.4779, "step": 10225 }, { "epoch": 0.41, "learning_rate": 8.031515151515152e-06, "loss": 0.4713, "step": 10250 }, { "epoch": 0.41, "learning_rate": 8.026464646464648e-06, "loss": 0.4525, "step": 10275 }, { "epoch": 0.41, "learning_rate": 8.021414141414142e-06, "loss": 0.459, "step": 10300 }, { "epoch": 0.41, "learning_rate": 8.016363636363636e-06, "loss": 0.4714, "step": 10325 }, { "epoch": 0.42, "learning_rate": 8.011313131313132e-06, "loss": 0.4553, "step": 10350 }, { "epoch": 0.42, "learning_rate": 8.006262626262626e-06, "loss": 0.4742, "step": 10375 }, { "epoch": 0.42, "learning_rate": 8.001212121212122e-06, "loss": 0.4661, "step": 10400 }, { "epoch": 0.42, "learning_rate": 7.996161616161617e-06, "loss": 0.4629, "step": 10425 }, { "epoch": 0.42, "learning_rate": 7.991111111111111e-06, "loss": 0.4588, "step": 10450 }, { "epoch": 0.42, "learning_rate": 7.986060606060607e-06, "loss": 0.4659, "step": 10475 }, { "epoch": 0.42, "learning_rate": 7.981010101010101e-06, "loss": 0.48, "step": 10500 }, { "epoch": 0.42, "learning_rate": 7.975959595959597e-06, "loss": 0.4733, "step": 10525 }, { "epoch": 0.42, "learning_rate": 7.970909090909092e-06, "loss": 0.453, "step": 10550 }, { "epoch": 0.42, "learning_rate": 7.965858585858588e-06, "loss": 0.4801, "step": 10575 }, { "epoch": 0.43, "learning_rate": 7.960808080808082e-06, "loss": 0.469, "step": 10600 }, { "epoch": 0.43, "learning_rate": 7.955959595959597e-06, "loss": 0.4507, "step": 10625 }, { "epoch": 0.43, "learning_rate": 7.950909090909092e-06, "loss": 0.4579, "step": 10650 }, { "epoch": 0.43, "learning_rate": 7.945858585858586e-06, "loss": 0.4767, "step": 10675 }, { "epoch": 0.43, "learning_rate": 7.94080808080808e-06, "loss": 0.4625, "step": 10700 }, { "epoch": 0.43, "learning_rate": 7.935757575757576e-06, "loss": 0.4727, "step": 10725 }, { "epoch": 0.43, "learning_rate": 7.93070707070707e-06, "loss": 0.4751, "step": 10750 }, { "epoch": 0.43, "learning_rate": 7.925656565656567e-06, "loss": 0.4682, "step": 10775 }, { "epoch": 0.43, "learning_rate": 7.920606060606061e-06, "loss": 0.4623, "step": 10800 }, { "epoch": 0.43, "learning_rate": 7.915555555555557e-06, "loss": 0.4775, "step": 10825 }, { "epoch": 0.44, "learning_rate": 7.910505050505051e-06, "loss": 0.4522, "step": 10850 }, { "epoch": 0.44, "learning_rate": 7.905454545454546e-06, "loss": 0.4873, "step": 10875 }, { "epoch": 0.44, "learning_rate": 7.90040404040404e-06, "loss": 0.4528, "step": 10900 }, { "epoch": 0.44, "learning_rate": 7.895353535353536e-06, "loss": 0.4521, "step": 10925 }, { "epoch": 0.44, "learning_rate": 7.890303030303032e-06, "loss": 0.4691, "step": 10950 }, { "epoch": 0.44, "learning_rate": 7.885252525252526e-06, "loss": 0.4294, "step": 10975 }, { "epoch": 0.44, "learning_rate": 7.880202020202022e-06, "loss": 0.4611, "step": 11000 }, { "epoch": 0.44, "learning_rate": 7.875151515151516e-06, "loss": 0.4458, "step": 11025 }, { "epoch": 0.44, "learning_rate": 7.87010101010101e-06, "loss": 0.4761, "step": 11050 }, { "epoch": 0.44, "learning_rate": 7.865050505050505e-06, "loss": 0.4584, "step": 11075 }, { "epoch": 0.45, "learning_rate": 7.860000000000001e-06, "loss": 0.4644, "step": 11100 }, { "epoch": 0.45, "learning_rate": 7.854949494949495e-06, "loss": 0.4633, "step": 11125 }, { "epoch": 0.45, "learning_rate": 7.849898989898991e-06, "loss": 0.4631, "step": 11150 }, { "epoch": 0.45, "learning_rate": 7.844848484848486e-06, "loss": 0.4461, "step": 11175 }, { "epoch": 0.45, "learning_rate": 7.83979797979798e-06, "loss": 0.4874, "step": 11200 }, { "epoch": 0.45, "learning_rate": 7.834747474747474e-06, "loss": 0.469, "step": 11225 }, { "epoch": 0.45, "learning_rate": 7.82969696969697e-06, "loss": 0.4195, "step": 11250 }, { "epoch": 0.45, "learning_rate": 7.824646464646464e-06, "loss": 0.4769, "step": 11275 }, { "epoch": 0.45, "learning_rate": 7.81959595959596e-06, "loss": 0.465, "step": 11300 }, { "epoch": 0.45, "learning_rate": 7.814545454545455e-06, "loss": 0.464, "step": 11325 }, { "epoch": 0.46, "learning_rate": 7.80949494949495e-06, "loss": 0.4559, "step": 11350 }, { "epoch": 0.46, "learning_rate": 7.804444444444445e-06, "loss": 0.466, "step": 11375 }, { "epoch": 0.46, "learning_rate": 7.79939393939394e-06, "loss": 0.4683, "step": 11400 }, { "epoch": 0.46, "learning_rate": 7.794343434343435e-06, "loss": 0.4619, "step": 11425 }, { "epoch": 0.46, "learning_rate": 7.78929292929293e-06, "loss": 0.457, "step": 11450 }, { "epoch": 0.46, "learning_rate": 7.784242424242426e-06, "loss": 0.4535, "step": 11475 }, { "epoch": 0.46, "learning_rate": 7.77919191919192e-06, "loss": 0.4749, "step": 11500 }, { "epoch": 0.46, "learning_rate": 7.774141414141416e-06, "loss": 0.4634, "step": 11525 }, { "epoch": 0.46, "learning_rate": 7.76909090909091e-06, "loss": 0.4517, "step": 11550 }, { "epoch": 0.46, "learning_rate": 7.764040404040404e-06, "loss": 0.457, "step": 11575 }, { "epoch": 0.47, "learning_rate": 7.758989898989899e-06, "loss": 0.464, "step": 11600 }, { "epoch": 0.47, "learning_rate": 7.753939393939395e-06, "loss": 0.4606, "step": 11625 }, { "epoch": 0.47, "learning_rate": 7.748888888888889e-06, "loss": 0.4593, "step": 11650 }, { "epoch": 0.47, "learning_rate": 7.743838383838385e-06, "loss": 0.4581, "step": 11675 }, { "epoch": 0.47, "learning_rate": 7.73878787878788e-06, "loss": 0.4554, "step": 11700 }, { "epoch": 0.47, "learning_rate": 7.733737373737374e-06, "loss": 0.4449, "step": 11725 }, { "epoch": 0.47, "learning_rate": 7.72868686868687e-06, "loss": 0.4626, "step": 11750 }, { "epoch": 0.47, "learning_rate": 7.723636363636364e-06, "loss": 0.4584, "step": 11775 }, { "epoch": 0.47, "learning_rate": 7.71858585858586e-06, "loss": 0.4659, "step": 11800 }, { "epoch": 0.47, "learning_rate": 7.713535353535354e-06, "loss": 0.459, "step": 11825 }, { "epoch": 0.48, "learning_rate": 7.70848484848485e-06, "loss": 0.463, "step": 11850 }, { "epoch": 0.48, "learning_rate": 7.703434343434344e-06, "loss": 0.4443, "step": 11875 }, { "epoch": 0.48, "learning_rate": 7.698383838383839e-06, "loss": 0.4517, "step": 11900 }, { "epoch": 0.48, "learning_rate": 7.693333333333333e-06, "loss": 0.4524, "step": 11925 }, { "epoch": 0.48, "learning_rate": 7.688282828282829e-06, "loss": 0.4523, "step": 11950 }, { "epoch": 0.48, "learning_rate": 7.683232323232323e-06, "loss": 0.4685, "step": 11975 }, { "epoch": 0.48, "learning_rate": 7.67818181818182e-06, "loss": 0.4485, "step": 12000 }, { "epoch": 0.48, "learning_rate": 7.673131313131314e-06, "loss": 0.4742, "step": 12025 }, { "epoch": 0.48, "learning_rate": 7.66808080808081e-06, "loss": 0.4501, "step": 12050 }, { "epoch": 0.48, "learning_rate": 7.663030303030304e-06, "loss": 0.4459, "step": 12075 }, { "epoch": 0.49, "learning_rate": 7.657979797979798e-06, "loss": 0.4643, "step": 12100 }, { "epoch": 0.49, "learning_rate": 7.652929292929293e-06, "loss": 0.4588, "step": 12125 }, { "epoch": 0.49, "learning_rate": 7.647878787878789e-06, "loss": 0.4591, "step": 12150 }, { "epoch": 0.49, "learning_rate": 7.642828282828283e-06, "loss": 0.4493, "step": 12175 }, { "epoch": 0.49, "learning_rate": 7.637777777777779e-06, "loss": 0.456, "step": 12200 }, { "epoch": 0.49, "learning_rate": 7.632727272727273e-06, "loss": 0.4726, "step": 12225 }, { "epoch": 0.49, "learning_rate": 7.627676767676768e-06, "loss": 0.4447, "step": 12250 }, { "epoch": 0.49, "learning_rate": 7.622626262626263e-06, "loss": 0.4495, "step": 12275 }, { "epoch": 0.49, "learning_rate": 7.617575757575758e-06, "loss": 0.4478, "step": 12300 }, { "epoch": 0.49, "learning_rate": 7.612525252525254e-06, "loss": 0.4667, "step": 12325 }, { "epoch": 0.5, "learning_rate": 7.607474747474748e-06, "loss": 0.4626, "step": 12350 }, { "epoch": 0.5, "learning_rate": 7.602424242424243e-06, "loss": 0.4549, "step": 12375 }, { "epoch": 0.5, "learning_rate": 7.597373737373737e-06, "loss": 0.4582, "step": 12400 }, { "epoch": 0.5, "learning_rate": 7.592323232323233e-06, "loss": 0.4496, "step": 12425 }, { "epoch": 0.5, "learning_rate": 7.587272727272728e-06, "loss": 0.4604, "step": 12450 }, { "epoch": 0.5, "learning_rate": 7.582222222222223e-06, "loss": 0.4592, "step": 12475 }, { "epoch": 0.5, "learning_rate": 7.577171717171717e-06, "loss": 0.4696, "step": 12500 }, { "epoch": 0.5, "eval_loss": 0.4565899670124054, "eval_runtime": 321.107, "eval_samples_per_second": 15.587, "eval_steps_per_second": 1.95, "eval_wer": 36.25145352286481, "step": 12500 }, { "epoch": 0.5, "learning_rate": 7.572121212121213e-06, "loss": 0.4294, "step": 12525 }, { "epoch": 0.5, "learning_rate": 7.5670707070707074e-06, "loss": 0.4358, "step": 12550 }, { "epoch": 0.5, "learning_rate": 7.5620202020202026e-06, "loss": 0.4569, "step": 12575 }, { "epoch": 0.51, "learning_rate": 7.556969696969697e-06, "loss": 0.4464, "step": 12600 }, { "epoch": 0.51, "learning_rate": 7.551919191919193e-06, "loss": 0.4645, "step": 12625 }, { "epoch": 0.51, "learning_rate": 7.547070707070708e-06, "loss": 0.4547, "step": 12650 }, { "epoch": 0.51, "learning_rate": 7.542020202020203e-06, "loss": 0.4748, "step": 12675 }, { "epoch": 0.51, "learning_rate": 7.536969696969697e-06, "loss": 0.4344, "step": 12700 }, { "epoch": 0.51, "learning_rate": 7.531919191919192e-06, "loss": 0.4418, "step": 12725 }, { "epoch": 0.51, "learning_rate": 7.526868686868688e-06, "loss": 0.4521, "step": 12750 }, { "epoch": 0.51, "learning_rate": 7.5218181818181825e-06, "loss": 0.4655, "step": 12775 }, { "epoch": 0.51, "learning_rate": 7.516767676767678e-06, "loss": 0.4499, "step": 12800 }, { "epoch": 0.51, "learning_rate": 7.511717171717172e-06, "loss": 0.4473, "step": 12825 }, { "epoch": 0.52, "learning_rate": 7.506666666666668e-06, "loss": 0.436, "step": 12850 }, { "epoch": 0.52, "learning_rate": 7.501616161616162e-06, "loss": 0.4446, "step": 12875 }, { "epoch": 0.52, "learning_rate": 7.496565656565657e-06, "loss": 0.4504, "step": 12900 }, { "epoch": 0.52, "learning_rate": 7.491515151515152e-06, "loss": 0.4611, "step": 12925 }, { "epoch": 0.52, "learning_rate": 7.486464646464648e-06, "loss": 0.4572, "step": 12950 }, { "epoch": 0.52, "learning_rate": 7.481414141414142e-06, "loss": 0.4517, "step": 12975 }, { "epoch": 0.52, "learning_rate": 7.476363636363637e-06, "loss": 0.4624, "step": 13000 }, { "epoch": 0.52, "learning_rate": 7.471313131313131e-06, "loss": 0.4618, "step": 13025 }, { "epoch": 0.52, "learning_rate": 7.466262626262627e-06, "loss": 0.4608, "step": 13050 }, { "epoch": 0.52, "learning_rate": 7.461212121212122e-06, "loss": 0.4573, "step": 13075 }, { "epoch": 0.53, "learning_rate": 7.456161616161617e-06, "loss": 0.4477, "step": 13100 }, { "epoch": 0.53, "learning_rate": 7.451111111111111e-06, "loss": 0.453, "step": 13125 }, { "epoch": 0.53, "learning_rate": 7.446060606060606e-06, "loss": 0.4737, "step": 13150 }, { "epoch": 0.53, "learning_rate": 7.441010101010102e-06, "loss": 0.4351, "step": 13175 }, { "epoch": 0.53, "learning_rate": 7.4359595959595965e-06, "loss": 0.4378, "step": 13200 }, { "epoch": 0.53, "learning_rate": 7.430909090909092e-06, "loss": 0.4598, "step": 13225 }, { "epoch": 0.53, "learning_rate": 7.425858585858586e-06, "loss": 0.4454, "step": 13250 }, { "epoch": 0.53, "learning_rate": 7.420808080808082e-06, "loss": 0.4307, "step": 13275 }, { "epoch": 0.53, "learning_rate": 7.415757575757576e-06, "loss": 0.4513, "step": 13300 }, { "epoch": 0.53, "learning_rate": 7.410707070707071e-06, "loss": 0.4448, "step": 13325 }, { "epoch": 0.54, "learning_rate": 7.405656565656566e-06, "loss": 0.452, "step": 13350 }, { "epoch": 0.54, "learning_rate": 7.400606060606062e-06, "loss": 0.4399, "step": 13375 }, { "epoch": 0.54, "learning_rate": 7.395555555555556e-06, "loss": 0.432, "step": 13400 }, { "epoch": 0.54, "learning_rate": 7.390505050505051e-06, "loss": 0.4261, "step": 13425 }, { "epoch": 0.54, "learning_rate": 7.3854545454545454e-06, "loss": 0.4497, "step": 13450 }, { "epoch": 0.54, "learning_rate": 7.380404040404041e-06, "loss": 0.4483, "step": 13475 }, { "epoch": 0.54, "learning_rate": 7.375353535353536e-06, "loss": 0.4701, "step": 13500 }, { "epoch": 0.54, "learning_rate": 7.370303030303031e-06, "loss": 0.4214, "step": 13525 }, { "epoch": 0.54, "learning_rate": 7.365252525252525e-06, "loss": 0.4399, "step": 13550 }, { "epoch": 0.54, "learning_rate": 7.360202020202021e-06, "loss": 0.4282, "step": 13575 }, { "epoch": 0.55, "learning_rate": 7.355151515151516e-06, "loss": 0.4441, "step": 13600 }, { "epoch": 0.55, "learning_rate": 7.350101010101011e-06, "loss": 0.4249, "step": 13625 }, { "epoch": 0.55, "learning_rate": 7.345050505050506e-06, "loss": 0.4295, "step": 13650 }, { "epoch": 0.55, "learning_rate": 7.340000000000001e-06, "loss": 0.4408, "step": 13675 }, { "epoch": 0.55, "learning_rate": 7.334949494949496e-06, "loss": 0.4572, "step": 13700 }, { "epoch": 0.55, "learning_rate": 7.32989898989899e-06, "loss": 0.4507, "step": 13725 }, { "epoch": 0.55, "learning_rate": 7.3248484848484855e-06, "loss": 0.4469, "step": 13750 }, { "epoch": 0.55, "learning_rate": 7.31979797979798e-06, "loss": 0.4359, "step": 13775 }, { "epoch": 0.55, "learning_rate": 7.314747474747476e-06, "loss": 0.4609, "step": 13800 }, { "epoch": 0.55, "learning_rate": 7.30969696969697e-06, "loss": 0.4651, "step": 13825 }, { "epoch": 0.56, "learning_rate": 7.304646464646465e-06, "loss": 0.443, "step": 13850 }, { "epoch": 0.56, "learning_rate": 7.2995959595959595e-06, "loss": 0.4593, "step": 13875 }, { "epoch": 0.56, "learning_rate": 7.2945454545454555e-06, "loss": 0.4594, "step": 13900 }, { "epoch": 0.56, "learning_rate": 7.28949494949495e-06, "loss": 0.419, "step": 13925 }, { "epoch": 0.56, "learning_rate": 7.284444444444445e-06, "loss": 0.4348, "step": 13950 }, { "epoch": 0.56, "learning_rate": 7.279393939393939e-06, "loss": 0.4551, "step": 13975 }, { "epoch": 0.56, "learning_rate": 7.274343434343435e-06, "loss": 0.4223, "step": 14000 }, { "epoch": 0.56, "learning_rate": 7.26929292929293e-06, "loss": 0.4658, "step": 14025 }, { "epoch": 0.56, "learning_rate": 7.264242424242425e-06, "loss": 0.4239, "step": 14050 }, { "epoch": 0.56, "learning_rate": 7.259191919191921e-06, "loss": 0.4249, "step": 14075 }, { "epoch": 0.57, "learning_rate": 7.254141414141415e-06, "loss": 0.4387, "step": 14100 }, { "epoch": 0.57, "learning_rate": 7.24909090909091e-06, "loss": 0.4284, "step": 14125 }, { "epoch": 0.57, "learning_rate": 7.244040404040404e-06, "loss": 0.4468, "step": 14150 }, { "epoch": 0.57, "learning_rate": 7.2389898989898995e-06, "loss": 0.4401, "step": 14175 }, { "epoch": 0.57, "learning_rate": 7.233939393939395e-06, "loss": 0.4362, "step": 14200 }, { "epoch": 0.57, "learning_rate": 7.22888888888889e-06, "loss": 0.4445, "step": 14225 }, { "epoch": 0.57, "learning_rate": 7.223838383838384e-06, "loss": 0.4435, "step": 14250 }, { "epoch": 0.57, "learning_rate": 7.218787878787879e-06, "loss": 0.4479, "step": 14275 }, { "epoch": 0.57, "learning_rate": 7.2137373737373735e-06, "loss": 0.4286, "step": 14300 }, { "epoch": 0.57, "learning_rate": 7.2086868686868695e-06, "loss": 0.428, "step": 14325 }, { "epoch": 0.58, "learning_rate": 7.203636363636364e-06, "loss": 0.4405, "step": 14350 }, { "epoch": 0.58, "learning_rate": 7.198585858585859e-06, "loss": 0.4454, "step": 14375 }, { "epoch": 0.58, "learning_rate": 7.193535353535353e-06, "loss": 0.4483, "step": 14400 }, { "epoch": 0.58, "learning_rate": 7.188484848484849e-06, "loss": 0.4449, "step": 14425 }, { "epoch": 0.58, "learning_rate": 7.183434343434344e-06, "loss": 0.4274, "step": 14450 }, { "epoch": 0.58, "learning_rate": 7.178383838383839e-06, "loss": 0.4208, "step": 14475 }, { "epoch": 0.58, "learning_rate": 7.173333333333335e-06, "loss": 0.4435, "step": 14500 }, { "epoch": 0.58, "learning_rate": 7.168282828282829e-06, "loss": 0.4329, "step": 14525 }, { "epoch": 0.58, "learning_rate": 7.163232323232324e-06, "loss": 0.3995, "step": 14550 }, { "epoch": 0.58, "learning_rate": 7.158181818181818e-06, "loss": 0.4609, "step": 14575 }, { "epoch": 0.59, "learning_rate": 7.153131313131314e-06, "loss": 0.4638, "step": 14600 }, { "epoch": 0.59, "learning_rate": 7.148080808080809e-06, "loss": 0.4249, "step": 14625 }, { "epoch": 0.59, "learning_rate": 7.143030303030304e-06, "loss": 0.4154, "step": 14650 }, { "epoch": 0.59, "learning_rate": 7.138181818181819e-06, "loss": 0.4388, "step": 14675 }, { "epoch": 0.59, "learning_rate": 7.133131313131314e-06, "loss": 0.4264, "step": 14700 }, { "epoch": 0.59, "learning_rate": 7.128080808080808e-06, "loss": 0.4408, "step": 14725 }, { "epoch": 0.59, "learning_rate": 7.123030303030304e-06, "loss": 0.4335, "step": 14750 }, { "epoch": 0.59, "learning_rate": 7.117979797979798e-06, "loss": 0.4502, "step": 14775 }, { "epoch": 0.59, "learning_rate": 7.1129292929292935e-06, "loss": 0.454, "step": 14800 }, { "epoch": 0.59, "learning_rate": 7.107878787878788e-06, "loss": 0.4547, "step": 14825 }, { "epoch": 0.6, "learning_rate": 7.102828282828284e-06, "loss": 0.4403, "step": 14850 }, { "epoch": 0.6, "learning_rate": 7.097777777777778e-06, "loss": 0.4273, "step": 14875 }, { "epoch": 0.6, "learning_rate": 7.092727272727273e-06, "loss": 0.4314, "step": 14900 }, { "epoch": 0.6, "learning_rate": 7.0876767676767675e-06, "loss": 0.4355, "step": 14925 }, { "epoch": 0.6, "learning_rate": 7.0826262626262635e-06, "loss": 0.4381, "step": 14950 }, { "epoch": 0.6, "learning_rate": 7.077575757575759e-06, "loss": 0.4259, "step": 14975 }, { "epoch": 0.6, "learning_rate": 7.072525252525253e-06, "loss": 0.4312, "step": 15000 }, { "epoch": 0.6, "eval_loss": 0.4432617723941803, "eval_runtime": 329.2864, "eval_samples_per_second": 15.2, "eval_steps_per_second": 1.901, "eval_wer": 36.87795154132751, "step": 15000 }, { "epoch": 0.6, "learning_rate": 7.067474747474748e-06, "loss": 0.4423, "step": 15025 }, { "epoch": 0.6, "learning_rate": 7.062424242424243e-06, "loss": 0.4302, "step": 15050 }, { "epoch": 0.6, "learning_rate": 7.057373737373738e-06, "loss": 0.441, "step": 15075 }, { "epoch": 0.61, "learning_rate": 7.052323232323233e-06, "loss": 0.4281, "step": 15100 }, { "epoch": 0.61, "learning_rate": 7.047272727272728e-06, "loss": 0.4295, "step": 15125 }, { "epoch": 0.61, "learning_rate": 7.042222222222223e-06, "loss": 0.4268, "step": 15150 }, { "epoch": 0.61, "learning_rate": 7.037171717171718e-06, "loss": 0.4347, "step": 15175 }, { "epoch": 0.61, "learning_rate": 7.032121212121212e-06, "loss": 0.4463, "step": 15200 }, { "epoch": 0.61, "learning_rate": 7.0270707070707075e-06, "loss": 0.425, "step": 15225 }, { "epoch": 0.61, "learning_rate": 7.022020202020202e-06, "loss": 0.4393, "step": 15250 }, { "epoch": 0.61, "learning_rate": 7.016969696969698e-06, "loss": 0.4356, "step": 15275 }, { "epoch": 0.61, "learning_rate": 7.011919191919192e-06, "loss": 0.4228, "step": 15300 }, { "epoch": 0.61, "learning_rate": 7.006868686868687e-06, "loss": 0.428, "step": 15325 }, { "epoch": 0.62, "learning_rate": 7.0018181818181815e-06, "loss": 0.4418, "step": 15350 }, { "epoch": 0.62, "learning_rate": 6.9967676767676775e-06, "loss": 0.4257, "step": 15375 }, { "epoch": 0.62, "learning_rate": 6.991717171717173e-06, "loss": 0.4362, "step": 15400 }, { "epoch": 0.62, "learning_rate": 6.986666666666667e-06, "loss": 0.4321, "step": 15425 }, { "epoch": 0.62, "learning_rate": 6.981616161616163e-06, "loss": 0.4244, "step": 15450 }, { "epoch": 0.62, "learning_rate": 6.976565656565657e-06, "loss": 0.4297, "step": 15475 }, { "epoch": 0.62, "learning_rate": 6.971515151515152e-06, "loss": 0.4245, "step": 15500 }, { "epoch": 0.62, "learning_rate": 6.966464646464647e-06, "loss": 0.426, "step": 15525 }, { "epoch": 0.62, "learning_rate": 6.961414141414143e-06, "loss": 0.4475, "step": 15550 }, { "epoch": 0.62, "learning_rate": 6.956363636363637e-06, "loss": 0.4407, "step": 15575 }, { "epoch": 0.63, "learning_rate": 6.951313131313132e-06, "loss": 0.4298, "step": 15600 }, { "epoch": 0.63, "learning_rate": 6.9462626262626264e-06, "loss": 0.4157, "step": 15625 }, { "epoch": 0.63, "learning_rate": 6.9412121212121216e-06, "loss": 0.4288, "step": 15650 }, { "epoch": 0.63, "learning_rate": 6.936161616161617e-06, "loss": 0.4294, "step": 15675 }, { "epoch": 0.63, "learning_rate": 6.931111111111112e-06, "loss": 0.4231, "step": 15700 }, { "epoch": 0.63, "learning_rate": 6.926060606060606e-06, "loss": 0.4392, "step": 15725 }, { "epoch": 0.63, "learning_rate": 6.921010101010101e-06, "loss": 0.4144, "step": 15750 }, { "epoch": 0.63, "learning_rate": 6.915959595959596e-06, "loss": 0.4438, "step": 15775 }, { "epoch": 0.63, "learning_rate": 6.910909090909092e-06, "loss": 0.4181, "step": 15800 }, { "epoch": 0.63, "learning_rate": 6.905858585858587e-06, "loss": 0.4177, "step": 15825 }, { "epoch": 0.64, "learning_rate": 6.900808080808081e-06, "loss": 0.4319, "step": 15850 }, { "epoch": 0.64, "learning_rate": 6.895757575757577e-06, "loss": 0.432, "step": 15875 }, { "epoch": 0.64, "learning_rate": 6.890707070707071e-06, "loss": 0.4332, "step": 15900 }, { "epoch": 0.64, "learning_rate": 6.8856565656565664e-06, "loss": 0.4174, "step": 15925 }, { "epoch": 0.64, "learning_rate": 6.880606060606061e-06, "loss": 0.4543, "step": 15950 }, { "epoch": 0.64, "learning_rate": 6.875555555555557e-06, "loss": 0.4187, "step": 15975 }, { "epoch": 0.64, "learning_rate": 6.870505050505051e-06, "loss": 0.4371, "step": 16000 }, { "epoch": 0.64, "learning_rate": 6.865454545454546e-06, "loss": 0.4377, "step": 16025 }, { "epoch": 0.64, "learning_rate": 6.8604040404040405e-06, "loss": 0.4432, "step": 16050 }, { "epoch": 0.64, "learning_rate": 6.8553535353535365e-06, "loss": 0.4261, "step": 16075 }, { "epoch": 0.65, "learning_rate": 6.850303030303031e-06, "loss": 0.436, "step": 16100 }, { "epoch": 0.65, "learning_rate": 6.845252525252526e-06, "loss": 0.4192, "step": 16125 }, { "epoch": 0.65, "learning_rate": 6.84020202020202e-06, "loss": 0.4363, "step": 16150 }, { "epoch": 0.65, "learning_rate": 6.835151515151515e-06, "loss": 0.4336, "step": 16175 }, { "epoch": 0.65, "learning_rate": 6.8301010101010105e-06, "loss": 0.4451, "step": 16200 }, { "epoch": 0.65, "learning_rate": 6.825050505050506e-06, "loss": 0.4131, "step": 16225 }, { "epoch": 0.65, "learning_rate": 6.820000000000001e-06, "loss": 0.4384, "step": 16250 }, { "epoch": 0.65, "learning_rate": 6.814949494949495e-06, "loss": 0.4177, "step": 16275 }, { "epoch": 0.65, "learning_rate": 6.809898989898991e-06, "loss": 0.4355, "step": 16300 }, { "epoch": 0.65, "learning_rate": 6.804848484848485e-06, "loss": 0.4168, "step": 16325 }, { "epoch": 0.66, "learning_rate": 6.7997979797979805e-06, "loss": 0.4193, "step": 16350 }, { "epoch": 0.66, "learning_rate": 6.794747474747475e-06, "loss": 0.417, "step": 16375 }, { "epoch": 0.66, "learning_rate": 6.789696969696971e-06, "loss": 0.4337, "step": 16400 }, { "epoch": 0.66, "learning_rate": 6.784646464646465e-06, "loss": 0.4253, "step": 16425 }, { "epoch": 0.66, "learning_rate": 6.77959595959596e-06, "loss": 0.421, "step": 16450 }, { "epoch": 0.66, "learning_rate": 6.7745454545454545e-06, "loss": 0.431, "step": 16475 }, { "epoch": 0.66, "learning_rate": 6.7694949494949505e-06, "loss": 0.4143, "step": 16500 }, { "epoch": 0.66, "learning_rate": 6.764444444444445e-06, "loss": 0.424, "step": 16525 }, { "epoch": 0.66, "learning_rate": 6.75939393939394e-06, "loss": 0.4172, "step": 16550 }, { "epoch": 0.66, "learning_rate": 6.754343434343434e-06, "loss": 0.434, "step": 16575 }, { "epoch": 0.67, "learning_rate": 6.74929292929293e-06, "loss": 0.4295, "step": 16600 }, { "epoch": 0.67, "learning_rate": 6.7442424242424245e-06, "loss": 0.4117, "step": 16625 }, { "epoch": 0.67, "learning_rate": 6.73919191919192e-06, "loss": 0.4188, "step": 16650 }, { "epoch": 0.67, "learning_rate": 6.734141414141415e-06, "loss": 0.4356, "step": 16675 }, { "epoch": 0.67, "learning_rate": 6.72909090909091e-06, "loss": 0.4422, "step": 16700 }, { "epoch": 0.67, "learning_rate": 6.724040404040405e-06, "loss": 0.4236, "step": 16725 }, { "epoch": 0.67, "learning_rate": 6.718989898989899e-06, "loss": 0.4122, "step": 16750 }, { "epoch": 0.67, "learning_rate": 6.714141414141415e-06, "loss": 0.4019, "step": 16775 }, { "epoch": 0.67, "learning_rate": 6.709090909090909e-06, "loss": 0.4294, "step": 16800 }, { "epoch": 0.67, "learning_rate": 6.704040404040405e-06, "loss": 0.425, "step": 16825 }, { "epoch": 0.68, "learning_rate": 6.6989898989899e-06, "loss": 0.4389, "step": 16850 }, { "epoch": 0.68, "learning_rate": 6.693939393939395e-06, "loss": 0.4441, "step": 16875 }, { "epoch": 0.68, "learning_rate": 6.688888888888889e-06, "loss": 0.4154, "step": 16900 }, { "epoch": 0.68, "learning_rate": 6.683838383838385e-06, "loss": 0.4263, "step": 16925 }, { "epoch": 0.68, "learning_rate": 6.678787878787879e-06, "loss": 0.4035, "step": 16950 }, { "epoch": 0.68, "learning_rate": 6.6737373737373745e-06, "loss": 0.4229, "step": 16975 }, { "epoch": 0.68, "learning_rate": 6.668686868686869e-06, "loss": 0.4078, "step": 17000 }, { "epoch": 0.68, "learning_rate": 6.663636363636365e-06, "loss": 0.4294, "step": 17025 }, { "epoch": 0.68, "learning_rate": 6.658585858585859e-06, "loss": 0.436, "step": 17050 }, { "epoch": 0.68, "learning_rate": 6.653535353535354e-06, "loss": 0.4341, "step": 17075 }, { "epoch": 0.69, "learning_rate": 6.6484848484848485e-06, "loss": 0.4185, "step": 17100 }, { "epoch": 0.69, "learning_rate": 6.643434343434344e-06, "loss": 0.427, "step": 17125 }, { "epoch": 0.69, "learning_rate": 6.638383838383839e-06, "loss": 0.4318, "step": 17150 }, { "epoch": 0.69, "learning_rate": 6.633333333333334e-06, "loss": 0.4168, "step": 17175 }, { "epoch": 0.69, "learning_rate": 6.628282828282829e-06, "loss": 0.424, "step": 17200 }, { "epoch": 0.69, "learning_rate": 6.623232323232323e-06, "loss": 0.4291, "step": 17225 }, { "epoch": 0.69, "learning_rate": 6.618181818181819e-06, "loss": 0.4211, "step": 17250 }, { "epoch": 0.69, "learning_rate": 6.613131313131314e-06, "loss": 0.4157, "step": 17275 }, { "epoch": 0.69, "learning_rate": 6.608080808080809e-06, "loss": 0.4334, "step": 17300 }, { "epoch": 0.69, "learning_rate": 6.603030303030303e-06, "loss": 0.4164, "step": 17325 }, { "epoch": 0.7, "learning_rate": 6.597979797979799e-06, "loss": 0.4346, "step": 17350 }, { "epoch": 0.7, "learning_rate": 6.592929292929293e-06, "loss": 0.4317, "step": 17375 }, { "epoch": 0.7, "learning_rate": 6.5878787878787885e-06, "loss": 0.439, "step": 17400 }, { "epoch": 0.7, "learning_rate": 6.582828282828283e-06, "loss": 0.4302, "step": 17425 }, { "epoch": 0.7, "learning_rate": 6.577777777777779e-06, "loss": 0.4337, "step": 17450 }, { "epoch": 0.7, "learning_rate": 6.572727272727273e-06, "loss": 0.4033, "step": 17475 }, { "epoch": 0.7, "learning_rate": 6.567676767676768e-06, "loss": 0.4208, "step": 17500 }, { "epoch": 0.7, "eval_loss": 0.43082931637763977, "eval_runtime": 307.9947, "eval_samples_per_second": 16.25, "eval_steps_per_second": 2.033, "eval_wer": 32.371437385794636, "step": 17500 }, { "epoch": 0.7, "learning_rate": 6.5626262626262625e-06, "loss": 0.4161, "step": 17525 }, { "epoch": 0.7, "learning_rate": 6.5575757575757585e-06, "loss": 0.4151, "step": 17550 }, { "epoch": 0.7, "learning_rate": 6.552525252525253e-06, "loss": 0.4389, "step": 17575 }, { "epoch": 0.71, "learning_rate": 6.547474747474748e-06, "loss": 0.4413, "step": 17600 }, { "epoch": 0.71, "learning_rate": 6.542424242424243e-06, "loss": 0.4208, "step": 17625 }, { "epoch": 0.71, "learning_rate": 6.537373737373737e-06, "loss": 0.4272, "step": 17650 }, { "epoch": 0.71, "learning_rate": 6.532323232323233e-06, "loss": 0.4095, "step": 17675 }, { "epoch": 0.71, "learning_rate": 6.527272727272728e-06, "loss": 0.431, "step": 17700 }, { "epoch": 0.71, "learning_rate": 6.522222222222223e-06, "loss": 0.4285, "step": 17725 }, { "epoch": 0.71, "learning_rate": 6.517171717171717e-06, "loss": 0.4086, "step": 17750 }, { "epoch": 0.71, "learning_rate": 6.512121212121213e-06, "loss": 0.435, "step": 17775 }, { "epoch": 0.71, "learning_rate": 6.507070707070707e-06, "loss": 0.4134, "step": 17800 }, { "epoch": 0.71, "learning_rate": 6.5020202020202026e-06, "loss": 0.4181, "step": 17825 }, { "epoch": 0.72, "learning_rate": 6.496969696969697e-06, "loss": 0.3998, "step": 17850 }, { "epoch": 0.72, "learning_rate": 6.491919191919193e-06, "loss": 0.4095, "step": 17875 }, { "epoch": 0.72, "learning_rate": 6.486868686868687e-06, "loss": 0.4344, "step": 17900 }, { "epoch": 0.72, "learning_rate": 6.481818181818182e-06, "loss": 0.4049, "step": 17925 }, { "epoch": 0.72, "learning_rate": 6.476767676767677e-06, "loss": 0.4204, "step": 17950 }, { "epoch": 0.72, "learning_rate": 6.4717171717171726e-06, "loss": 0.4377, "step": 17975 }, { "epoch": 0.72, "learning_rate": 6.466666666666667e-06, "loss": 0.4247, "step": 18000 }, { "epoch": 0.72, "learning_rate": 6.461616161616162e-06, "loss": 0.4249, "step": 18025 }, { "epoch": 0.72, "learning_rate": 6.456565656565658e-06, "loss": 0.4067, "step": 18050 }, { "epoch": 0.72, "learning_rate": 6.451515151515152e-06, "loss": 0.4149, "step": 18075 }, { "epoch": 0.73, "learning_rate": 6.4464646464646474e-06, "loss": 0.4059, "step": 18100 }, { "epoch": 0.73, "learning_rate": 6.441414141414142e-06, "loss": 0.4207, "step": 18125 }, { "epoch": 0.73, "learning_rate": 6.436363636363637e-06, "loss": 0.4135, "step": 18150 }, { "epoch": 0.73, "learning_rate": 6.431313131313132e-06, "loss": 0.4335, "step": 18175 }, { "epoch": 0.73, "learning_rate": 6.426262626262627e-06, "loss": 0.423, "step": 18200 }, { "epoch": 0.73, "learning_rate": 6.4212121212121215e-06, "loss": 0.4142, "step": 18225 }, { "epoch": 0.73, "learning_rate": 6.416161616161617e-06, "loss": 0.4417, "step": 18250 }, { "epoch": 0.73, "learning_rate": 6.411111111111111e-06, "loss": 0.424, "step": 18275 }, { "epoch": 0.73, "learning_rate": 6.406060606060607e-06, "loss": 0.4286, "step": 18300 }, { "epoch": 0.73, "learning_rate": 6.401010101010101e-06, "loss": 0.4143, "step": 18325 }, { "epoch": 0.74, "learning_rate": 6.395959595959596e-06, "loss": 0.4154, "step": 18350 }, { "epoch": 0.74, "learning_rate": 6.390909090909091e-06, "loss": 0.4065, "step": 18375 }, { "epoch": 0.74, "learning_rate": 6.385858585858587e-06, "loss": 0.4251, "step": 18400 }, { "epoch": 0.74, "learning_rate": 6.380808080808081e-06, "loss": 0.4203, "step": 18425 }, { "epoch": 0.74, "learning_rate": 6.375757575757576e-06, "loss": 0.3992, "step": 18450 }, { "epoch": 0.74, "learning_rate": 6.370707070707072e-06, "loss": 0.4243, "step": 18475 }, { "epoch": 0.74, "learning_rate": 6.365656565656566e-06, "loss": 0.4465, "step": 18500 }, { "epoch": 0.74, "learning_rate": 6.3606060606060615e-06, "loss": 0.4089, "step": 18525 }, { "epoch": 0.74, "learning_rate": 6.355555555555556e-06, "loss": 0.4242, "step": 18550 }, { "epoch": 0.74, "learning_rate": 6.350505050505052e-06, "loss": 0.4295, "step": 18575 }, { "epoch": 0.75, "learning_rate": 6.345454545454546e-06, "loss": 0.4053, "step": 18600 }, { "epoch": 0.75, "learning_rate": 6.340404040404041e-06, "loss": 0.4106, "step": 18625 }, { "epoch": 0.75, "learning_rate": 6.3353535353535355e-06, "loss": 0.4287, "step": 18650 }, { "epoch": 0.75, "learning_rate": 6.330303030303031e-06, "loss": 0.4265, "step": 18675 }, { "epoch": 0.75, "learning_rate": 6.325252525252526e-06, "loss": 0.4328, "step": 18700 }, { "epoch": 0.75, "learning_rate": 6.320202020202021e-06, "loss": 0.4071, "step": 18725 }, { "epoch": 0.75, "learning_rate": 6.315151515151515e-06, "loss": 0.4214, "step": 18750 }, { "epoch": 0.75, "learning_rate": 6.31010101010101e-06, "loss": 0.4108, "step": 18775 }, { "epoch": 0.75, "learning_rate": 6.305050505050505e-06, "loss": 0.4262, "step": 18800 }, { "epoch": 0.75, "learning_rate": 6.300000000000001e-06, "loss": 0.3884, "step": 18825 }, { "epoch": 0.76, "learning_rate": 6.294949494949495e-06, "loss": 0.411, "step": 18850 }, { "epoch": 0.76, "learning_rate": 6.28989898989899e-06, "loss": 0.4229, "step": 18875 }, { "epoch": 0.76, "learning_rate": 6.284848484848486e-06, "loss": 0.4252, "step": 18900 }, { "epoch": 0.76, "learning_rate": 6.27979797979798e-06, "loss": 0.4134, "step": 18925 }, { "epoch": 0.76, "learning_rate": 6.2747474747474755e-06, "loss": 0.4265, "step": 18950 }, { "epoch": 0.76, "learning_rate": 6.26969696969697e-06, "loss": 0.395, "step": 18975 }, { "epoch": 0.76, "learning_rate": 6.264646464646466e-06, "loss": 0.417, "step": 19000 }, { "epoch": 0.76, "learning_rate": 6.25959595959596e-06, "loss": 0.4259, "step": 19025 }, { "epoch": 0.76, "learning_rate": 6.254545454545455e-06, "loss": 0.4009, "step": 19050 }, { "epoch": 0.76, "learning_rate": 6.2494949494949496e-06, "loss": 0.399, "step": 19075 }, { "epoch": 0.77, "learning_rate": 6.2444444444444456e-06, "loss": 0.4098, "step": 19100 }, { "epoch": 0.77, "learning_rate": 6.23939393939394e-06, "loss": 0.4192, "step": 19125 }, { "epoch": 0.77, "learning_rate": 6.2345454545454555e-06, "loss": 0.4068, "step": 19150 }, { "epoch": 0.77, "learning_rate": 6.22949494949495e-06, "loss": 0.426, "step": 19175 }, { "epoch": 0.77, "learning_rate": 6.224444444444445e-06, "loss": 0.4072, "step": 19200 }, { "epoch": 0.77, "learning_rate": 6.219393939393939e-06, "loss": 0.4181, "step": 19225 }, { "epoch": 0.77, "learning_rate": 6.214343434343435e-06, "loss": 0.4127, "step": 19250 }, { "epoch": 0.77, "learning_rate": 6.2092929292929295e-06, "loss": 0.4244, "step": 19275 }, { "epoch": 0.77, "learning_rate": 6.204242424242425e-06, "loss": 0.4168, "step": 19300 }, { "epoch": 0.77, "learning_rate": 6.199191919191919e-06, "loss": 0.4112, "step": 19325 }, { "epoch": 0.78, "learning_rate": 6.194141414141415e-06, "loss": 0.4162, "step": 19350 }, { "epoch": 0.78, "learning_rate": 6.18909090909091e-06, "loss": 0.3985, "step": 19375 }, { "epoch": 0.78, "learning_rate": 6.184040404040404e-06, "loss": 0.428, "step": 19400 }, { "epoch": 0.78, "learning_rate": 6.1789898989899e-06, "loss": 0.4175, "step": 19425 }, { "epoch": 0.78, "learning_rate": 6.173939393939395e-06, "loss": 0.4138, "step": 19450 }, { "epoch": 0.78, "learning_rate": 6.16888888888889e-06, "loss": 0.3978, "step": 19475 }, { "epoch": 0.78, "learning_rate": 6.163838383838384e-06, "loss": 0.4213, "step": 19500 }, { "epoch": 0.78, "learning_rate": 6.15878787878788e-06, "loss": 0.408, "step": 19525 }, { "epoch": 0.78, "learning_rate": 6.153737373737374e-06, "loss": 0.4107, "step": 19550 }, { "epoch": 0.78, "learning_rate": 6.1486868686868695e-06, "loss": 0.4061, "step": 19575 }, { "epoch": 0.79, "learning_rate": 6.143636363636364e-06, "loss": 0.4142, "step": 19600 }, { "epoch": 0.79, "learning_rate": 6.138585858585859e-06, "loss": 0.4182, "step": 19625 }, { "epoch": 0.79, "learning_rate": 6.133535353535354e-06, "loss": 0.4174, "step": 19650 }, { "epoch": 0.79, "learning_rate": 6.128484848484849e-06, "loss": 0.4284, "step": 19675 }, { "epoch": 0.79, "learning_rate": 6.1234343434343435e-06, "loss": 0.4023, "step": 19700 }, { "epoch": 0.79, "learning_rate": 6.118383838383839e-06, "loss": 0.4249, "step": 19725 }, { "epoch": 0.79, "learning_rate": 6.113333333333333e-06, "loss": 0.4049, "step": 19750 }, { "epoch": 0.79, "learning_rate": 6.108282828282829e-06, "loss": 0.4137, "step": 19775 }, { "epoch": 0.79, "learning_rate": 6.103232323232324e-06, "loss": 0.4084, "step": 19800 }, { "epoch": 0.79, "learning_rate": 6.098181818181818e-06, "loss": 0.4209, "step": 19825 }, { "epoch": 0.8, "learning_rate": 6.093131313131314e-06, "loss": 0.4114, "step": 19850 }, { "epoch": 0.8, "learning_rate": 6.088080808080809e-06, "loss": 0.4121, "step": 19875 }, { "epoch": 0.8, "learning_rate": 6.083030303030304e-06, "loss": 0.4279, "step": 19900 }, { "epoch": 0.8, "learning_rate": 6.077979797979798e-06, "loss": 0.4275, "step": 19925 }, { "epoch": 0.8, "learning_rate": 6.072929292929294e-06, "loss": 0.4075, "step": 19950 }, { "epoch": 0.8, "learning_rate": 6.067878787878788e-06, "loss": 0.4179, "step": 19975 }, { "epoch": 0.8, "learning_rate": 6.0628282828282836e-06, "loss": 0.4089, "step": 20000 }, { "epoch": 0.8, "eval_loss": 0.4228692054748535, "eval_runtime": 313.9546, "eval_samples_per_second": 15.942, "eval_steps_per_second": 1.994, "eval_wer": 33.41085455278957, "step": 20000 }, { "epoch": 0.8, "learning_rate": 6.057777777777778e-06, "loss": 0.4367, "step": 20025 }, { "epoch": 0.8, "learning_rate": 6.052727272727274e-06, "loss": 0.4269, "step": 20050 }, { "epoch": 0.8, "learning_rate": 6.047676767676768e-06, "loss": 0.4196, "step": 20075 }, { "epoch": 0.81, "learning_rate": 6.042626262626263e-06, "loss": 0.4006, "step": 20100 }, { "epoch": 0.81, "learning_rate": 6.0375757575757576e-06, "loss": 0.4113, "step": 20125 }, { "epoch": 0.81, "learning_rate": 6.032525252525253e-06, "loss": 0.413, "step": 20150 }, { "epoch": 0.81, "learning_rate": 6.027474747474748e-06, "loss": 0.4234, "step": 20175 }, { "epoch": 0.81, "learning_rate": 6.022424242424243e-06, "loss": 0.424, "step": 20200 }, { "epoch": 0.81, "learning_rate": 6.017373737373737e-06, "loss": 0.4187, "step": 20225 }, { "epoch": 0.81, "learning_rate": 6.0123232323232324e-06, "loss": 0.4066, "step": 20250 }, { "epoch": 0.81, "learning_rate": 6.0072727272727284e-06, "loss": 0.4126, "step": 20275 }, { "epoch": 0.81, "learning_rate": 6.002222222222223e-06, "loss": 0.4026, "step": 20300 }, { "epoch": 0.82, "learning_rate": 5.997171717171718e-06, "loss": 0.3976, "step": 20325 }, { "epoch": 0.82, "learning_rate": 5.992121212121212e-06, "loss": 0.4272, "step": 20350 }, { "epoch": 0.82, "learning_rate": 5.987070707070708e-06, "loss": 0.4242, "step": 20375 }, { "epoch": 0.82, "learning_rate": 5.9820202020202025e-06, "loss": 0.4108, "step": 20400 }, { "epoch": 0.82, "learning_rate": 5.976969696969698e-06, "loss": 0.426, "step": 20425 }, { "epoch": 0.82, "learning_rate": 5.971919191919192e-06, "loss": 0.4276, "step": 20450 }, { "epoch": 0.82, "learning_rate": 5.966868686868688e-06, "loss": 0.4193, "step": 20475 }, { "epoch": 0.82, "learning_rate": 5.961818181818182e-06, "loss": 0.4073, "step": 20500 }, { "epoch": 0.82, "learning_rate": 5.956767676767677e-06, "loss": 0.4294, "step": 20525 }, { "epoch": 0.82, "learning_rate": 5.951717171717172e-06, "loss": 0.4127, "step": 20550 }, { "epoch": 0.83, "learning_rate": 5.946666666666668e-06, "loss": 0.4075, "step": 20575 }, { "epoch": 0.83, "learning_rate": 5.941616161616162e-06, "loss": 0.3962, "step": 20600 }, { "epoch": 0.83, "learning_rate": 5.936565656565657e-06, "loss": 0.414, "step": 20625 }, { "epoch": 0.83, "learning_rate": 5.931515151515151e-06, "loss": 0.4167, "step": 20650 }, { "epoch": 0.83, "learning_rate": 5.926464646464647e-06, "loss": 0.4155, "step": 20675 }, { "epoch": 0.83, "learning_rate": 5.9214141414141425e-06, "loss": 0.4072, "step": 20700 }, { "epoch": 0.83, "learning_rate": 5.916363636363637e-06, "loss": 0.4028, "step": 20725 }, { "epoch": 0.83, "learning_rate": 5.911313131313132e-06, "loss": 0.4195, "step": 20750 }, { "epoch": 0.83, "learning_rate": 5.906262626262626e-06, "loss": 0.4224, "step": 20775 }, { "epoch": 0.83, "learning_rate": 5.901212121212122e-06, "loss": 0.406, "step": 20800 }, { "epoch": 0.84, "learning_rate": 5.8961616161616165e-06, "loss": 0.4145, "step": 20825 }, { "epoch": 0.84, "learning_rate": 5.891111111111112e-06, "loss": 0.4041, "step": 20850 }, { "epoch": 0.84, "learning_rate": 5.886060606060606e-06, "loss": 0.4062, "step": 20875 }, { "epoch": 0.84, "learning_rate": 5.881010101010102e-06, "loss": 0.4046, "step": 20900 }, { "epoch": 0.84, "learning_rate": 5.875959595959596e-06, "loss": 0.4375, "step": 20925 }, { "epoch": 0.84, "learning_rate": 5.870909090909091e-06, "loss": 0.4266, "step": 20950 }, { "epoch": 0.84, "learning_rate": 5.865858585858586e-06, "loss": 0.4102, "step": 20975 }, { "epoch": 0.84, "learning_rate": 5.860808080808082e-06, "loss": 0.4138, "step": 21000 }, { "epoch": 0.84, "learning_rate": 5.855757575757576e-06, "loss": 0.4086, "step": 21025 }, { "epoch": 0.84, "learning_rate": 5.850707070707071e-06, "loss": 0.4002, "step": 21050 }, { "epoch": 0.85, "learning_rate": 5.845656565656565e-06, "loss": 0.3841, "step": 21075 }, { "epoch": 0.85, "learning_rate": 5.840606060606061e-06, "loss": 0.4017, "step": 21100 }, { "epoch": 0.85, "learning_rate": 5.8355555555555565e-06, "loss": 0.4092, "step": 21125 }, { "epoch": 0.85, "learning_rate": 5.830505050505051e-06, "loss": 0.4161, "step": 21150 }, { "epoch": 0.85, "learning_rate": 5.825454545454546e-06, "loss": 0.3923, "step": 21175 }, { "epoch": 0.85, "learning_rate": 5.820404040404041e-06, "loss": 0.4073, "step": 21200 }, { "epoch": 0.85, "learning_rate": 5.815353535353536e-06, "loss": 0.3931, "step": 21225 }, { "epoch": 0.85, "learning_rate": 5.8103030303030306e-06, "loss": 0.3999, "step": 21250 }, { "epoch": 0.85, "learning_rate": 5.805252525252526e-06, "loss": 0.3947, "step": 21275 }, { "epoch": 0.85, "learning_rate": 5.80020202020202e-06, "loss": 0.4091, "step": 21300 }, { "epoch": 0.86, "learning_rate": 5.795151515151516e-06, "loss": 0.3898, "step": 21325 }, { "epoch": 0.86, "learning_rate": 5.79010101010101e-06, "loss": 0.4089, "step": 21350 }, { "epoch": 0.86, "learning_rate": 5.785050505050505e-06, "loss": 0.4212, "step": 21375 }, { "epoch": 0.86, "learning_rate": 5.78e-06, "loss": 0.4273, "step": 21400 }, { "epoch": 0.86, "learning_rate": 5.774949494949496e-06, "loss": 0.422, "step": 21425 }, { "epoch": 0.86, "learning_rate": 5.76989898989899e-06, "loss": 0.4094, "step": 21450 }, { "epoch": 0.86, "learning_rate": 5.764848484848485e-06, "loss": 0.4442, "step": 21475 }, { "epoch": 0.86, "learning_rate": 5.7597979797979794e-06, "loss": 0.4052, "step": 21500 }, { "epoch": 0.86, "learning_rate": 5.7547474747474754e-06, "loss": 0.4111, "step": 21525 }, { "epoch": 0.86, "learning_rate": 5.749696969696971e-06, "loss": 0.417, "step": 21550 }, { "epoch": 0.87, "learning_rate": 5.744646464646465e-06, "loss": 0.3936, "step": 21575 }, { "epoch": 0.87, "learning_rate": 5.739595959595961e-06, "loss": 0.392, "step": 21600 }, { "epoch": 0.87, "learning_rate": 5.734545454545455e-06, "loss": 0.4233, "step": 21625 }, { "epoch": 0.87, "learning_rate": 5.72949494949495e-06, "loss": 0.3902, "step": 21650 }, { "epoch": 0.87, "learning_rate": 5.724444444444445e-06, "loss": 0.4107, "step": 21675 }, { "epoch": 0.87, "learning_rate": 5.71939393939394e-06, "loss": 0.4171, "step": 21700 }, { "epoch": 0.87, "learning_rate": 5.714343434343435e-06, "loss": 0.42, "step": 21725 }, { "epoch": 0.87, "learning_rate": 5.70929292929293e-06, "loss": 0.4245, "step": 21750 }, { "epoch": 0.87, "learning_rate": 5.704242424242424e-06, "loss": 0.417, "step": 21775 }, { "epoch": 0.87, "learning_rate": 5.6991919191919195e-06, "loss": 0.4052, "step": 21800 }, { "epoch": 0.88, "learning_rate": 5.694141414141415e-06, "loss": 0.4282, "step": 21825 }, { "epoch": 0.88, "learning_rate": 5.68909090909091e-06, "loss": 0.4263, "step": 21850 }, { "epoch": 0.88, "learning_rate": 5.684040404040404e-06, "loss": 0.4163, "step": 21875 }, { "epoch": 0.88, "learning_rate": 5.678989898989899e-06, "loss": 0.4095, "step": 21900 }, { "epoch": 0.88, "learning_rate": 5.6739393939393935e-06, "loss": 0.4134, "step": 21925 }, { "epoch": 0.88, "learning_rate": 5.6688888888888895e-06, "loss": 0.4124, "step": 21950 }, { "epoch": 0.88, "learning_rate": 5.663838383838385e-06, "loss": 0.3975, "step": 21975 }, { "epoch": 0.88, "learning_rate": 5.658787878787879e-06, "loss": 0.4044, "step": 22000 }, { "epoch": 0.88, "learning_rate": 5.653737373737375e-06, "loss": 0.3992, "step": 22025 }, { "epoch": 0.88, "learning_rate": 5.648686868686869e-06, "loss": 0.4173, "step": 22050 }, { "epoch": 0.89, "learning_rate": 5.643636363636364e-06, "loss": 0.4212, "step": 22075 }, { "epoch": 0.89, "learning_rate": 5.638585858585859e-06, "loss": 0.4066, "step": 22100 }, { "epoch": 0.89, "learning_rate": 5.633535353535355e-06, "loss": 0.4141, "step": 22125 }, { "epoch": 0.89, "learning_rate": 5.628484848484849e-06, "loss": 0.4004, "step": 22150 }, { "epoch": 0.89, "learning_rate": 5.623434343434344e-06, "loss": 0.4123, "step": 22175 }, { "epoch": 0.89, "learning_rate": 5.618383838383838e-06, "loss": 0.4064, "step": 22200 }, { "epoch": 0.89, "learning_rate": 5.613333333333334e-06, "loss": 0.4156, "step": 22225 }, { "epoch": 0.89, "learning_rate": 5.608282828282829e-06, "loss": 0.3922, "step": 22250 }, { "epoch": 0.89, "learning_rate": 5.603232323232324e-06, "loss": 0.4172, "step": 22275 }, { "epoch": 0.89, "learning_rate": 5.598181818181818e-06, "loss": 0.4073, "step": 22300 }, { "epoch": 0.9, "learning_rate": 5.593131313131313e-06, "loss": 0.3981, "step": 22325 }, { "epoch": 0.9, "learning_rate": 5.588080808080808e-06, "loss": 0.4175, "step": 22350 }, { "epoch": 0.9, "learning_rate": 5.5830303030303035e-06, "loss": 0.407, "step": 22375 }, { "epoch": 0.9, "learning_rate": 5.577979797979799e-06, "loss": 0.3995, "step": 22400 }, { "epoch": 0.9, "learning_rate": 5.572929292929293e-06, "loss": 0.4078, "step": 22425 }, { "epoch": 0.9, "learning_rate": 5.567878787878789e-06, "loss": 0.3822, "step": 22450 }, { "epoch": 0.9, "learning_rate": 5.562828282828283e-06, "loss": 0.4089, "step": 22475 }, { "epoch": 0.9, "learning_rate": 5.557777777777778e-06, "loss": 0.4163, "step": 22500 }, { "epoch": 0.9, "eval_loss": 0.41425320506095886, "eval_runtime": 313.671, "eval_samples_per_second": 15.956, "eval_steps_per_second": 1.996, "eval_wer": 32.542300481739005, "step": 22500 }, { "epoch": 0.9, "learning_rate": 5.552727272727273e-06, "loss": 0.4018, "step": 22525 }, { "epoch": 0.9, "learning_rate": 5.547676767676769e-06, "loss": 0.4308, "step": 22550 }, { "epoch": 0.91, "learning_rate": 5.542626262626263e-06, "loss": 0.4127, "step": 22575 }, { "epoch": 0.91, "learning_rate": 5.537575757575758e-06, "loss": 0.4111, "step": 22600 }, { "epoch": 0.91, "learning_rate": 5.532525252525252e-06, "loss": 0.4069, "step": 22625 }, { "epoch": 0.91, "learning_rate": 5.527474747474748e-06, "loss": 0.4216, "step": 22650 }, { "epoch": 0.91, "learning_rate": 5.522424242424243e-06, "loss": 0.3984, "step": 22675 }, { "epoch": 0.91, "learning_rate": 5.517373737373738e-06, "loss": 0.3949, "step": 22700 }, { "epoch": 0.91, "learning_rate": 5.512323232323232e-06, "loss": 0.3936, "step": 22725 }, { "epoch": 0.91, "learning_rate": 5.507272727272728e-06, "loss": 0.4118, "step": 22750 }, { "epoch": 0.91, "learning_rate": 5.5022222222222224e-06, "loss": 0.3797, "step": 22775 }, { "epoch": 0.91, "learning_rate": 5.497171717171718e-06, "loss": 0.4043, "step": 22800 }, { "epoch": 0.92, "learning_rate": 5.492323232323232e-06, "loss": 0.405, "step": 22825 }, { "epoch": 0.92, "learning_rate": 5.4872727272727275e-06, "loss": 0.3987, "step": 22850 }, { "epoch": 0.92, "learning_rate": 5.4822222222222235e-06, "loss": 0.4005, "step": 22875 }, { "epoch": 0.92, "learning_rate": 5.477171717171718e-06, "loss": 0.4014, "step": 22900 }, { "epoch": 0.92, "learning_rate": 5.472121212121213e-06, "loss": 0.4098, "step": 22925 }, { "epoch": 0.92, "learning_rate": 5.467070707070707e-06, "loss": 0.4111, "step": 22950 }, { "epoch": 0.92, "learning_rate": 5.462020202020203e-06, "loss": 0.4014, "step": 22975 }, { "epoch": 0.92, "learning_rate": 5.4569696969696975e-06, "loss": 0.4246, "step": 23000 }, { "epoch": 0.92, "learning_rate": 5.451919191919193e-06, "loss": 0.4103, "step": 23025 }, { "epoch": 0.92, "learning_rate": 5.446868686868687e-06, "loss": 0.3985, "step": 23050 }, { "epoch": 0.93, "learning_rate": 5.441818181818183e-06, "loss": 0.4221, "step": 23075 }, { "epoch": 0.93, "learning_rate": 5.436767676767677e-06, "loss": 0.4059, "step": 23100 }, { "epoch": 0.93, "learning_rate": 5.431717171717172e-06, "loss": 0.4058, "step": 23125 }, { "epoch": 0.93, "learning_rate": 5.426666666666667e-06, "loss": 0.41, "step": 23150 }, { "epoch": 0.93, "learning_rate": 5.421616161616162e-06, "loss": 0.4012, "step": 23175 }, { "epoch": 0.93, "learning_rate": 5.416565656565657e-06, "loss": 0.4175, "step": 23200 }, { "epoch": 0.93, "learning_rate": 5.411515151515152e-06, "loss": 0.3962, "step": 23225 }, { "epoch": 0.93, "learning_rate": 5.406464646464646e-06, "loss": 0.3994, "step": 23250 }, { "epoch": 0.93, "learning_rate": 5.4014141414141415e-06, "loss": 0.4042, "step": 23275 }, { "epoch": 0.93, "learning_rate": 5.3963636363636375e-06, "loss": 0.4133, "step": 23300 }, { "epoch": 0.94, "learning_rate": 5.391313131313132e-06, "loss": 0.3976, "step": 23325 }, { "epoch": 0.94, "learning_rate": 5.386262626262627e-06, "loss": 0.4217, "step": 23350 }, { "epoch": 0.94, "learning_rate": 5.381212121212121e-06, "loss": 0.4119, "step": 23375 }, { "epoch": 0.94, "learning_rate": 5.376161616161617e-06, "loss": 0.3959, "step": 23400 }, { "epoch": 0.94, "learning_rate": 5.3711111111111115e-06, "loss": 0.4011, "step": 23425 }, { "epoch": 0.94, "learning_rate": 5.366060606060607e-06, "loss": 0.4159, "step": 23450 }, { "epoch": 0.94, "learning_rate": 5.361010101010101e-06, "loss": 0.3831, "step": 23475 }, { "epoch": 0.94, "learning_rate": 5.355959595959597e-06, "loss": 0.4047, "step": 23500 }, { "epoch": 0.94, "learning_rate": 5.350909090909091e-06, "loss": 0.4134, "step": 23525 }, { "epoch": 0.94, "learning_rate": 5.345858585858586e-06, "loss": 0.4057, "step": 23550 }, { "epoch": 0.95, "learning_rate": 5.340808080808081e-06, "loss": 0.3774, "step": 23575 }, { "epoch": 0.95, "learning_rate": 5.335757575757577e-06, "loss": 0.385, "step": 23600 }, { "epoch": 0.95, "learning_rate": 5.330707070707071e-06, "loss": 0.4194, "step": 23625 }, { "epoch": 0.95, "learning_rate": 5.325656565656566e-06, "loss": 0.3963, "step": 23650 }, { "epoch": 0.95, "learning_rate": 5.3206060606060604e-06, "loss": 0.3942, "step": 23675 }, { "epoch": 0.95, "learning_rate": 5.3155555555555564e-06, "loss": 0.3933, "step": 23700 }, { "epoch": 0.95, "learning_rate": 5.310505050505051e-06, "loss": 0.3855, "step": 23725 }, { "epoch": 0.95, "learning_rate": 5.305454545454546e-06, "loss": 0.398, "step": 23750 }, { "epoch": 0.95, "learning_rate": 5.300404040404041e-06, "loss": 0.3858, "step": 23775 }, { "epoch": 0.95, "learning_rate": 5.295353535353535e-06, "loss": 0.4117, "step": 23800 }, { "epoch": 0.96, "learning_rate": 5.290303030303031e-06, "loss": 0.3883, "step": 23825 }, { "epoch": 0.96, "learning_rate": 5.285252525252526e-06, "loss": 0.4188, "step": 23850 }, { "epoch": 0.96, "learning_rate": 5.280202020202021e-06, "loss": 0.4152, "step": 23875 }, { "epoch": 0.96, "learning_rate": 5.275151515151515e-06, "loss": 0.417, "step": 23900 }, { "epoch": 0.96, "learning_rate": 5.270101010101011e-06, "loss": 0.3981, "step": 23925 }, { "epoch": 0.96, "learning_rate": 5.265050505050505e-06, "loss": 0.3862, "step": 23950 }, { "epoch": 0.96, "learning_rate": 5.2600000000000005e-06, "loss": 0.4005, "step": 23975 }, { "epoch": 0.96, "learning_rate": 5.254949494949495e-06, "loss": 0.3917, "step": 24000 }, { "epoch": 0.96, "learning_rate": 5.249898989898991e-06, "loss": 0.4012, "step": 24025 }, { "epoch": 0.96, "learning_rate": 5.244848484848485e-06, "loss": 0.4039, "step": 24050 }, { "epoch": 0.97, "learning_rate": 5.23979797979798e-06, "loss": 0.4166, "step": 24075 }, { "epoch": 0.97, "learning_rate": 5.2347474747474745e-06, "loss": 0.3985, "step": 24100 }, { "epoch": 0.97, "learning_rate": 5.2296969696969705e-06, "loss": 0.3946, "step": 24125 }, { "epoch": 0.97, "learning_rate": 5.224646464646465e-06, "loss": 0.4177, "step": 24150 }, { "epoch": 0.97, "learning_rate": 5.21959595959596e-06, "loss": 0.4052, "step": 24175 }, { "epoch": 0.97, "learning_rate": 5.214545454545455e-06, "loss": 0.4122, "step": 24200 }, { "epoch": 0.97, "learning_rate": 5.20949494949495e-06, "loss": 0.3905, "step": 24225 }, { "epoch": 0.97, "learning_rate": 5.204444444444445e-06, "loss": 0.4207, "step": 24250 }, { "epoch": 0.97, "learning_rate": 5.19939393939394e-06, "loss": 0.4138, "step": 24275 }, { "epoch": 0.97, "learning_rate": 5.194343434343435e-06, "loss": 0.3948, "step": 24300 }, { "epoch": 0.98, "learning_rate": 5.189292929292929e-06, "loss": 0.4039, "step": 24325 }, { "epoch": 0.98, "learning_rate": 5.184242424242425e-06, "loss": 0.3919, "step": 24350 }, { "epoch": 0.98, "learning_rate": 5.179191919191919e-06, "loss": 0.4047, "step": 24375 }, { "epoch": 0.98, "learning_rate": 5.1741414141414145e-06, "loss": 0.4308, "step": 24400 }, { "epoch": 0.98, "learning_rate": 5.169090909090909e-06, "loss": 0.3794, "step": 24425 }, { "epoch": 0.98, "learning_rate": 5.164040404040405e-06, "loss": 0.3918, "step": 24450 }, { "epoch": 0.98, "learning_rate": 5.158989898989899e-06, "loss": 0.4171, "step": 24475 }, { "epoch": 0.98, "learning_rate": 5.153939393939394e-06, "loss": 0.3838, "step": 24500 }, { "epoch": 0.98, "learning_rate": 5.1488888888888885e-06, "loss": 0.3948, "step": 24525 }, { "epoch": 0.98, "learning_rate": 5.1438383838383845e-06, "loss": 0.41, "step": 24550 }, { "epoch": 0.99, "learning_rate": 5.138787878787879e-06, "loss": 0.3874, "step": 24575 }, { "epoch": 0.99, "learning_rate": 5.133737373737374e-06, "loss": 0.3965, "step": 24600 }, { "epoch": 0.99, "learning_rate": 5.12868686868687e-06, "loss": 0.4062, "step": 24625 }, { "epoch": 0.99, "learning_rate": 5.123636363636364e-06, "loss": 0.4094, "step": 24650 }, { "epoch": 0.99, "learning_rate": 5.118585858585859e-06, "loss": 0.3903, "step": 24675 }, { "epoch": 0.99, "learning_rate": 5.113535353535354e-06, "loss": 0.3958, "step": 24700 }, { "epoch": 0.99, "learning_rate": 5.10848484848485e-06, "loss": 0.4025, "step": 24725 }, { "epoch": 0.99, "learning_rate": 5.103434343434344e-06, "loss": 0.4163, "step": 24750 }, { "epoch": 0.99, "learning_rate": 5.098383838383839e-06, "loss": 0.4031, "step": 24775 }, { "epoch": 0.99, "learning_rate": 5.093333333333333e-06, "loss": 0.3995, "step": 24800 }, { "epoch": 1.0, "learning_rate": 5.0882828282828286e-06, "loss": 0.404, "step": 24825 }, { "epoch": 1.0, "learning_rate": 5.083232323232324e-06, "loss": 0.3939, "step": 24850 }, { "epoch": 1.0, "learning_rate": 5.078181818181819e-06, "loss": 0.402, "step": 24875 }, { "epoch": 1.0, "learning_rate": 5.073131313131313e-06, "loss": 0.3975, "step": 24900 }, { "epoch": 1.0, "learning_rate": 5.068080808080808e-06, "loss": 0.3895, "step": 24925 }, { "epoch": 1.0, "learning_rate": 5.063030303030303e-06, "loss": 0.3973, "step": 24950 }, { "epoch": 1.0, "learning_rate": 5.0579797979797986e-06, "loss": 0.3876, "step": 24975 }, { "epoch": 1.0, "learning_rate": 5.052929292929293e-06, "loss": 0.3831, "step": 25000 }, { "epoch": 1.0, "eval_loss": 0.4076802432537079, "eval_runtime": 310.8735, "eval_samples_per_second": 16.1, "eval_steps_per_second": 2.014, "eval_wer": 31.695104297681482, "step": 25000 }, { "epoch": 1.0, "learning_rate": 5.047878787878788e-06, "loss": 0.3901, "step": 25025 }, { "epoch": 1.0, "learning_rate": 5.042828282828284e-06, "loss": 0.3626, "step": 25050 }, { "epoch": 1.01, "learning_rate": 5.037777777777778e-06, "loss": 0.4023, "step": 25075 }, { "epoch": 1.01, "learning_rate": 5.0327272727272734e-06, "loss": 0.3804, "step": 25100 }, { "epoch": 1.01, "learning_rate": 5.027676767676768e-06, "loss": 0.3772, "step": 25125 }, { "epoch": 1.01, "learning_rate": 5.022626262626264e-06, "loss": 0.3845, "step": 25150 }, { "epoch": 1.01, "learning_rate": 5.017575757575758e-06, "loss": 0.3764, "step": 25175 }, { "epoch": 1.01, "learning_rate": 5.012525252525253e-06, "loss": 0.38, "step": 25200 }, { "epoch": 1.01, "learning_rate": 5.0074747474747475e-06, "loss": 0.387, "step": 25225 }, { "epoch": 1.01, "learning_rate": 5.0024242424242435e-06, "loss": 0.3782, "step": 25250 }, { "epoch": 1.01, "learning_rate": 4.997373737373738e-06, "loss": 0.3734, "step": 25275 }, { "epoch": 1.01, "learning_rate": 4.992323232323233e-06, "loss": 0.4094, "step": 25300 }, { "epoch": 1.02, "learning_rate": 4.987272727272728e-06, "loss": 0.3939, "step": 25325 }, { "epoch": 1.02, "learning_rate": 4.982222222222222e-06, "loss": 0.3967, "step": 25350 }, { "epoch": 1.02, "learning_rate": 4.9771717171717175e-06, "loss": 0.3831, "step": 25375 }, { "epoch": 1.02, "learning_rate": 4.972121212121213e-06, "loss": 0.3657, "step": 25400 }, { "epoch": 1.02, "learning_rate": 4.967070707070708e-06, "loss": 0.3967, "step": 25425 }, { "epoch": 1.02, "learning_rate": 4.962020202020202e-06, "loss": 0.3957, "step": 25450 }, { "epoch": 1.02, "learning_rate": 4.956969696969697e-06, "loss": 0.3893, "step": 25475 }, { "epoch": 1.02, "learning_rate": 4.951919191919192e-06, "loss": 0.3874, "step": 25500 }, { "epoch": 1.02, "learning_rate": 4.9468686868686875e-06, "loss": 0.3782, "step": 25525 }, { "epoch": 1.02, "learning_rate": 4.941818181818182e-06, "loss": 0.3871, "step": 25550 }, { "epoch": 1.03, "learning_rate": 4.936767676767677e-06, "loss": 0.3951, "step": 25575 }, { "epoch": 1.03, "learning_rate": 4.931717171717172e-06, "loss": 0.3814, "step": 25600 }, { "epoch": 1.03, "learning_rate": 4.926666666666667e-06, "loss": 0.3715, "step": 25625 }, { "epoch": 1.03, "learning_rate": 4.921616161616162e-06, "loss": 0.3838, "step": 25650 }, { "epoch": 1.03, "learning_rate": 4.9165656565656575e-06, "loss": 0.3876, "step": 25675 }, { "epoch": 1.03, "learning_rate": 4.911515151515152e-06, "loss": 0.393, "step": 25700 }, { "epoch": 1.03, "learning_rate": 4.906464646464647e-06, "loss": 0.3932, "step": 25725 }, { "epoch": 1.03, "learning_rate": 4.901414141414142e-06, "loss": 0.3824, "step": 25750 }, { "epoch": 1.03, "learning_rate": 4.896363636363637e-06, "loss": 0.3721, "step": 25775 }, { "epoch": 1.03, "learning_rate": 4.8913131313131315e-06, "loss": 0.373, "step": 25800 }, { "epoch": 1.04, "learning_rate": 4.886262626262627e-06, "loss": 0.3911, "step": 25825 }, { "epoch": 1.04, "learning_rate": 4.881212121212122e-06, "loss": 0.375, "step": 25850 }, { "epoch": 1.04, "learning_rate": 4.876161616161617e-06, "loss": 0.3832, "step": 25875 }, { "epoch": 1.04, "learning_rate": 4.871111111111111e-06, "loss": 0.3944, "step": 25900 }, { "epoch": 1.04, "learning_rate": 4.866060606060606e-06, "loss": 0.3886, "step": 25925 }, { "epoch": 1.04, "learning_rate": 4.8610101010101015e-06, "loss": 0.3893, "step": 25950 }, { "epoch": 1.04, "learning_rate": 4.855959595959596e-06, "loss": 0.381, "step": 25975 }, { "epoch": 1.04, "learning_rate": 4.850909090909091e-06, "loss": 0.3811, "step": 26000 }, { "epoch": 1.04, "learning_rate": 4.845858585858586e-06, "loss": 0.3792, "step": 26025 }, { "epoch": 1.04, "learning_rate": 4.840808080808081e-06, "loss": 0.3789, "step": 26050 }, { "epoch": 1.05, "learning_rate": 4.835757575757576e-06, "loss": 0.3986, "step": 26075 }, { "epoch": 1.05, "learning_rate": 4.8307070707070715e-06, "loss": 0.3866, "step": 26100 }, { "epoch": 1.05, "learning_rate": 4.825656565656566e-06, "loss": 0.3888, "step": 26125 }, { "epoch": 1.05, "learning_rate": 4.820606060606061e-06, "loss": 0.3927, "step": 26150 }, { "epoch": 1.05, "learning_rate": 4.815555555555556e-06, "loss": 0.3709, "step": 26175 }, { "epoch": 1.05, "learning_rate": 4.810505050505051e-06, "loss": 0.3929, "step": 26200 }, { "epoch": 1.05, "learning_rate": 4.8054545454545456e-06, "loss": 0.3845, "step": 26225 }, { "epoch": 1.05, "learning_rate": 4.800404040404041e-06, "loss": 0.3757, "step": 26250 }, { "epoch": 1.05, "learning_rate": 4.795353535353536e-06, "loss": 0.3837, "step": 26275 }, { "epoch": 1.05, "learning_rate": 4.790303030303031e-06, "loss": 0.3939, "step": 26300 }, { "epoch": 1.06, "learning_rate": 4.785252525252525e-06, "loss": 0.3898, "step": 26325 }, { "epoch": 1.06, "learning_rate": 4.7802020202020204e-06, "loss": 0.377, "step": 26350 }, { "epoch": 1.06, "learning_rate": 4.775151515151516e-06, "loss": 0.3675, "step": 26375 }, { "epoch": 1.06, "learning_rate": 4.770101010101011e-06, "loss": 0.3781, "step": 26400 }, { "epoch": 1.06, "learning_rate": 4.765050505050505e-06, "loss": 0.3861, "step": 26425 }, { "epoch": 1.06, "learning_rate": 4.76e-06, "loss": 0.3626, "step": 26450 }, { "epoch": 1.06, "learning_rate": 4.754949494949495e-06, "loss": 0.3803, "step": 26475 }, { "epoch": 1.06, "learning_rate": 4.7498989898989905e-06, "loss": 0.3873, "step": 26500 }, { "epoch": 1.06, "learning_rate": 4.744848484848486e-06, "loss": 0.3894, "step": 26525 }, { "epoch": 1.06, "learning_rate": 4.739797979797981e-06, "loss": 0.3702, "step": 26550 }, { "epoch": 1.07, "learning_rate": 4.734747474747475e-06, "loss": 0.3703, "step": 26575 }, { "epoch": 1.07, "learning_rate": 4.72969696969697e-06, "loss": 0.3921, "step": 26600 }, { "epoch": 1.07, "learning_rate": 4.724646464646465e-06, "loss": 0.3711, "step": 26625 }, { "epoch": 1.07, "learning_rate": 4.7195959595959605e-06, "loss": 0.3698, "step": 26650 }, { "epoch": 1.07, "learning_rate": 4.714545454545455e-06, "loss": 0.4003, "step": 26675 }, { "epoch": 1.07, "learning_rate": 4.70949494949495e-06, "loss": 0.3753, "step": 26700 }, { "epoch": 1.07, "learning_rate": 4.704444444444445e-06, "loss": 0.3758, "step": 26725 }, { "epoch": 1.07, "learning_rate": 4.699393939393939e-06, "loss": 0.3859, "step": 26750 }, { "epoch": 1.07, "learning_rate": 4.6943434343434345e-06, "loss": 0.3941, "step": 26775 }, { "epoch": 1.07, "learning_rate": 4.68929292929293e-06, "loss": 0.3668, "step": 26800 }, { "epoch": 1.08, "learning_rate": 4.684444444444444e-06, "loss": 0.372, "step": 26825 }, { "epoch": 1.08, "learning_rate": 4.67959595959596e-06, "loss": 0.3784, "step": 26850 }, { "epoch": 1.08, "learning_rate": 4.674545454545455e-06, "loss": 0.3788, "step": 26875 }, { "epoch": 1.08, "learning_rate": 4.6694949494949494e-06, "loss": 0.3934, "step": 26900 }, { "epoch": 1.08, "learning_rate": 4.664444444444445e-06, "loss": 0.3674, "step": 26925 }, { "epoch": 1.08, "learning_rate": 4.65939393939394e-06, "loss": 0.3955, "step": 26950 }, { "epoch": 1.08, "learning_rate": 4.654343434343435e-06, "loss": 0.3911, "step": 26975 }, { "epoch": 1.08, "learning_rate": 4.649292929292929e-06, "loss": 0.377, "step": 27000 }, { "epoch": 1.08, "learning_rate": 4.644242424242424e-06, "loss": 0.3726, "step": 27025 }, { "epoch": 1.08, "learning_rate": 4.6391919191919195e-06, "loss": 0.3804, "step": 27050 }, { "epoch": 1.09, "learning_rate": 4.634141414141415e-06, "loss": 0.3942, "step": 27075 }, { "epoch": 1.09, "learning_rate": 4.62909090909091e-06, "loss": 0.4027, "step": 27100 }, { "epoch": 1.09, "learning_rate": 4.624040404040405e-06, "loss": 0.3764, "step": 27125 }, { "epoch": 1.09, "learning_rate": 4.618989898989899e-06, "loss": 0.3919, "step": 27150 }, { "epoch": 1.09, "learning_rate": 4.613939393939394e-06, "loss": 0.3839, "step": 27175 }, { "epoch": 1.09, "learning_rate": 4.6088888888888895e-06, "loss": 0.3623, "step": 27200 }, { "epoch": 1.09, "learning_rate": 4.603838383838385e-06, "loss": 0.3779, "step": 27225 }, { "epoch": 1.09, "learning_rate": 4.598787878787879e-06, "loss": 0.3885, "step": 27250 }, { "epoch": 1.09, "learning_rate": 4.593737373737374e-06, "loss": 0.3758, "step": 27275 }, { "epoch": 1.09, "learning_rate": 4.588686868686869e-06, "loss": 0.3776, "step": 27300 }, { "epoch": 1.1, "learning_rate": 4.583636363636364e-06, "loss": 0.401, "step": 27325 }, { "epoch": 1.1, "learning_rate": 4.578585858585859e-06, "loss": 0.3718, "step": 27350 }, { "epoch": 1.1, "learning_rate": 4.573535353535354e-06, "loss": 0.3863, "step": 27375 }, { "epoch": 1.1, "learning_rate": 4.568484848484849e-06, "loss": 0.3867, "step": 27400 }, { "epoch": 1.1, "learning_rate": 4.563434343434344e-06, "loss": 0.367, "step": 27425 }, { "epoch": 1.1, "learning_rate": 4.558383838383838e-06, "loss": 0.3986, "step": 27450 }, { "epoch": 1.1, "learning_rate": 4.5533333333333335e-06, "loss": 0.3798, "step": 27475 }, { "epoch": 1.1, "learning_rate": 4.548282828282829e-06, "loss": 0.3842, "step": 27500 }, { "epoch": 1.1, "eval_loss": 0.4022856056690216, "eval_runtime": 322.6887, "eval_samples_per_second": 15.51, "eval_steps_per_second": 1.94, "eval_wer": 33.63155271838439, "step": 27500 }, { "epoch": 1.1, "learning_rate": 4.543232323232323e-06, "loss": 0.361, "step": 27525 }, { "epoch": 1.1, "learning_rate": 4.538181818181819e-06, "loss": 0.3699, "step": 27550 }, { "epoch": 1.11, "learning_rate": 4.533131313131314e-06, "loss": 0.3763, "step": 27575 }, { "epoch": 1.11, "learning_rate": 4.528080808080808e-06, "loss": 0.371, "step": 27600 }, { "epoch": 1.11, "learning_rate": 4.5230303030303035e-06, "loss": 0.3696, "step": 27625 }, { "epoch": 1.11, "learning_rate": 4.517979797979799e-06, "loss": 0.3897, "step": 27650 }, { "epoch": 1.11, "learning_rate": 4.512929292929294e-06, "loss": 0.3757, "step": 27675 }, { "epoch": 1.11, "learning_rate": 4.507878787878788e-06, "loss": 0.3852, "step": 27700 }, { "epoch": 1.11, "learning_rate": 4.502828282828283e-06, "loss": 0.3945, "step": 27725 }, { "epoch": 1.11, "learning_rate": 4.497777777777778e-06, "loss": 0.3839, "step": 27750 }, { "epoch": 1.11, "learning_rate": 4.492727272727273e-06, "loss": 0.3827, "step": 27775 }, { "epoch": 1.11, "learning_rate": 4.487676767676768e-06, "loss": 0.3886, "step": 27800 }, { "epoch": 1.12, "learning_rate": 4.482626262626263e-06, "loss": 0.3664, "step": 27825 }, { "epoch": 1.12, "learning_rate": 4.477575757575758e-06, "loss": 0.3928, "step": 27850 }, { "epoch": 1.12, "learning_rate": 4.472525252525252e-06, "loss": 0.3776, "step": 27875 }, { "epoch": 1.12, "learning_rate": 4.4674747474747475e-06, "loss": 0.3925, "step": 27900 }, { "epoch": 1.12, "learning_rate": 4.462424242424243e-06, "loss": 0.3815, "step": 27925 }, { "epoch": 1.12, "learning_rate": 4.457373737373738e-06, "loss": 0.3881, "step": 27950 }, { "epoch": 1.12, "learning_rate": 4.452323232323233e-06, "loss": 0.3703, "step": 27975 }, { "epoch": 1.12, "learning_rate": 4.447272727272728e-06, "loss": 0.3955, "step": 28000 }, { "epoch": 1.12, "learning_rate": 4.442222222222222e-06, "loss": 0.3786, "step": 28025 }, { "epoch": 1.12, "learning_rate": 4.4371717171717176e-06, "loss": 0.4067, "step": 28050 }, { "epoch": 1.13, "learning_rate": 4.432121212121213e-06, "loss": 0.3632, "step": 28075 }, { "epoch": 1.13, "learning_rate": 4.427070707070708e-06, "loss": 0.381, "step": 28100 }, { "epoch": 1.13, "learning_rate": 4.422020202020202e-06, "loss": 0.3744, "step": 28125 }, { "epoch": 1.13, "learning_rate": 4.416969696969697e-06, "loss": 0.3843, "step": 28150 }, { "epoch": 1.13, "learning_rate": 4.4119191919191924e-06, "loss": 0.3729, "step": 28175 }, { "epoch": 1.13, "learning_rate": 4.4068686868686876e-06, "loss": 0.3548, "step": 28200 }, { "epoch": 1.13, "learning_rate": 4.401818181818182e-06, "loss": 0.3733, "step": 28225 }, { "epoch": 1.13, "learning_rate": 4.396767676767677e-06, "loss": 0.3919, "step": 28250 }, { "epoch": 1.13, "learning_rate": 4.391717171717172e-06, "loss": 0.3762, "step": 28275 }, { "epoch": 1.13, "learning_rate": 4.3866666666666665e-06, "loss": 0.3767, "step": 28300 }, { "epoch": 1.14, "learning_rate": 4.381616161616162e-06, "loss": 0.3704, "step": 28325 }, { "epoch": 1.14, "learning_rate": 4.376565656565657e-06, "loss": 0.3963, "step": 28350 }, { "epoch": 1.14, "learning_rate": 4.371515151515152e-06, "loss": 0.3824, "step": 28375 }, { "epoch": 1.14, "learning_rate": 4.366464646464647e-06, "loss": 0.3832, "step": 28400 }, { "epoch": 1.14, "learning_rate": 4.361414141414142e-06, "loss": 0.366, "step": 28425 }, { "epoch": 1.14, "learning_rate": 4.356363636363637e-06, "loss": 0.377, "step": 28450 }, { "epoch": 1.14, "learning_rate": 4.351313131313132e-06, "loss": 0.3651, "step": 28475 }, { "epoch": 1.14, "learning_rate": 4.346262626262627e-06, "loss": 0.3938, "step": 28500 }, { "epoch": 1.14, "learning_rate": 4.341212121212122e-06, "loss": 0.3796, "step": 28525 }, { "epoch": 1.14, "learning_rate": 4.336161616161616e-06, "loss": 0.3877, "step": 28550 }, { "epoch": 1.15, "learning_rate": 4.331111111111111e-06, "loss": 0.3801, "step": 28575 }, { "epoch": 1.15, "learning_rate": 4.3260606060606065e-06, "loss": 0.3907, "step": 28600 }, { "epoch": 1.15, "learning_rate": 4.321010101010102e-06, "loss": 0.3832, "step": 28625 }, { "epoch": 1.15, "learning_rate": 4.315959595959596e-06, "loss": 0.3799, "step": 28650 }, { "epoch": 1.15, "learning_rate": 4.310909090909091e-06, "loss": 0.3825, "step": 28675 }, { "epoch": 1.15, "learning_rate": 4.305858585858586e-06, "loss": 0.3681, "step": 28700 }, { "epoch": 1.15, "learning_rate": 4.300808080808081e-06, "loss": 0.3675, "step": 28725 }, { "epoch": 1.15, "learning_rate": 4.295757575757576e-06, "loss": 0.3728, "step": 28750 }, { "epoch": 1.15, "learning_rate": 4.290707070707071e-06, "loss": 0.3684, "step": 28775 }, { "epoch": 1.15, "learning_rate": 4.285656565656566e-06, "loss": 0.3687, "step": 28800 }, { "epoch": 1.16, "learning_rate": 4.280606060606061e-06, "loss": 0.365, "step": 28825 }, { "epoch": 1.16, "learning_rate": 4.275555555555556e-06, "loss": 0.3874, "step": 28850 }, { "epoch": 1.16, "learning_rate": 4.270505050505051e-06, "loss": 0.3783, "step": 28875 }, { "epoch": 1.16, "learning_rate": 4.265454545454546e-06, "loss": 0.3832, "step": 28900 }, { "epoch": 1.16, "learning_rate": 4.260404040404041e-06, "loss": 0.3815, "step": 28925 }, { "epoch": 1.16, "learning_rate": 4.255353535353536e-06, "loss": 0.3875, "step": 28950 }, { "epoch": 1.16, "learning_rate": 4.250303030303031e-06, "loss": 0.3624, "step": 28975 }, { "epoch": 1.16, "learning_rate": 4.245252525252525e-06, "loss": 0.3646, "step": 29000 }, { "epoch": 1.16, "learning_rate": 4.2402020202020205e-06, "loss": 0.3803, "step": 29025 }, { "epoch": 1.16, "learning_rate": 4.235151515151516e-06, "loss": 0.3728, "step": 29050 }, { "epoch": 1.17, "learning_rate": 4.23010101010101e-06, "loss": 0.3881, "step": 29075 }, { "epoch": 1.17, "learning_rate": 4.225050505050505e-06, "loss": 0.375, "step": 29100 }, { "epoch": 1.17, "learning_rate": 4.22e-06, "loss": 0.3652, "step": 29125 }, { "epoch": 1.17, "learning_rate": 4.214949494949495e-06, "loss": 0.384, "step": 29150 }, { "epoch": 1.17, "learning_rate": 4.20989898989899e-06, "loss": 0.3605, "step": 29175 }, { "epoch": 1.17, "learning_rate": 4.204848484848485e-06, "loss": 0.3659, "step": 29200 }, { "epoch": 1.17, "learning_rate": 4.19979797979798e-06, "loss": 0.3696, "step": 29225 }, { "epoch": 1.17, "learning_rate": 4.194747474747475e-06, "loss": 0.3855, "step": 29250 }, { "epoch": 1.17, "learning_rate": 4.18969696969697e-06, "loss": 0.3844, "step": 29275 }, { "epoch": 1.17, "learning_rate": 4.184646464646465e-06, "loss": 0.363, "step": 29300 }, { "epoch": 1.18, "learning_rate": 4.17959595959596e-06, "loss": 0.376, "step": 29325 }, { "epoch": 1.18, "learning_rate": 4.174545454545455e-06, "loss": 0.3875, "step": 29350 }, { "epoch": 1.18, "learning_rate": 4.16949494949495e-06, "loss": 0.3933, "step": 29375 }, { "epoch": 1.18, "learning_rate": 4.164444444444445e-06, "loss": 0.3746, "step": 29400 }, { "epoch": 1.18, "learning_rate": 4.1593939393939394e-06, "loss": 0.3743, "step": 29425 }, { "epoch": 1.18, "learning_rate": 4.1543434343434346e-06, "loss": 0.3803, "step": 29450 }, { "epoch": 1.18, "learning_rate": 4.14929292929293e-06, "loss": 0.3782, "step": 29475 }, { "epoch": 1.18, "learning_rate": 4.144242424242425e-06, "loss": 0.3827, "step": 29500 }, { "epoch": 1.18, "learning_rate": 4.139191919191919e-06, "loss": 0.3827, "step": 29525 }, { "epoch": 1.18, "learning_rate": 4.134141414141414e-06, "loss": 0.3686, "step": 29550 }, { "epoch": 1.19, "learning_rate": 4.1290909090909094e-06, "loss": 0.3547, "step": 29575 }, { "epoch": 1.19, "learning_rate": 4.124040404040405e-06, "loss": 0.3831, "step": 29600 }, { "epoch": 1.19, "learning_rate": 4.118989898989899e-06, "loss": 0.374, "step": 29625 }, { "epoch": 1.19, "learning_rate": 4.113939393939394e-06, "loss": 0.3723, "step": 29650 }, { "epoch": 1.19, "learning_rate": 4.108888888888889e-06, "loss": 0.3813, "step": 29675 }, { "epoch": 1.19, "learning_rate": 4.103838383838384e-06, "loss": 0.382, "step": 29700 }, { "epoch": 1.19, "learning_rate": 4.0987878787878795e-06, "loss": 0.3801, "step": 29725 }, { "epoch": 1.19, "learning_rate": 4.093737373737375e-06, "loss": 0.3686, "step": 29750 }, { "epoch": 1.19, "learning_rate": 4.088686868686869e-06, "loss": 0.3743, "step": 29775 }, { "epoch": 1.19, "learning_rate": 4.083636363636364e-06, "loss": 0.3665, "step": 29800 }, { "epoch": 1.2, "learning_rate": 4.078585858585859e-06, "loss": 0.3657, "step": 29825 }, { "epoch": 1.2, "learning_rate": 4.0735353535353535e-06, "loss": 0.3683, "step": 29850 }, { "epoch": 1.2, "learning_rate": 4.068484848484849e-06, "loss": 0.3697, "step": 29875 }, { "epoch": 1.2, "learning_rate": 4.063434343434344e-06, "loss": 0.387, "step": 29900 }, { "epoch": 1.2, "learning_rate": 4.058383838383839e-06, "loss": 0.3793, "step": 29925 }, { "epoch": 1.2, "learning_rate": 4.053333333333333e-06, "loss": 0.3765, "step": 29950 }, { "epoch": 1.2, "learning_rate": 4.048282828282828e-06, "loss": 0.3854, "step": 29975 }, { "epoch": 1.2, "learning_rate": 4.0432323232323235e-06, "loss": 0.3848, "step": 30000 }, { "epoch": 1.2, "eval_loss": 0.3984352946281433, "eval_runtime": 321.4637, "eval_samples_per_second": 15.569, "eval_steps_per_second": 1.947, "eval_wer": 30.10987446308645, "step": 30000 }, { "epoch": 1.2, "learning_rate": 4.038181818181819e-06, "loss": 0.3611, "step": 30025 }, { "epoch": 1.2, "learning_rate": 4.033131313131313e-06, "loss": 0.3679, "step": 30050 }, { "epoch": 1.21, "learning_rate": 4.028080808080808e-06, "loss": 0.3871, "step": 30075 }, { "epoch": 1.21, "learning_rate": 4.023030303030303e-06, "loss": 0.37, "step": 30100 }, { "epoch": 1.21, "learning_rate": 4.017979797979798e-06, "loss": 0.3907, "step": 30125 }, { "epoch": 1.21, "learning_rate": 4.0129292929292935e-06, "loss": 0.3855, "step": 30150 }, { "epoch": 1.21, "learning_rate": 4.007878787878789e-06, "loss": 0.3823, "step": 30175 }, { "epoch": 1.21, "learning_rate": 4.002828282828283e-06, "loss": 0.3737, "step": 30200 }, { "epoch": 1.21, "learning_rate": 3.997777777777778e-06, "loss": 0.3771, "step": 30225 }, { "epoch": 1.21, "learning_rate": 3.992727272727273e-06, "loss": 0.3616, "step": 30250 }, { "epoch": 1.21, "learning_rate": 3.987676767676768e-06, "loss": 0.3891, "step": 30275 }, { "epoch": 1.22, "learning_rate": 3.982626262626263e-06, "loss": 0.3803, "step": 30300 }, { "epoch": 1.22, "learning_rate": 3.977575757575758e-06, "loss": 0.3833, "step": 30325 }, { "epoch": 1.22, "learning_rate": 3.972525252525253e-06, "loss": 0.3839, "step": 30350 }, { "epoch": 1.22, "learning_rate": 3.967474747474748e-06, "loss": 0.3631, "step": 30375 }, { "epoch": 1.22, "learning_rate": 3.962424242424242e-06, "loss": 0.3719, "step": 30400 }, { "epoch": 1.22, "learning_rate": 3.9573737373737375e-06, "loss": 0.369, "step": 30425 }, { "epoch": 1.22, "learning_rate": 3.952323232323233e-06, "loss": 0.3953, "step": 30450 }, { "epoch": 1.22, "learning_rate": 3.947272727272727e-06, "loss": 0.3675, "step": 30475 }, { "epoch": 1.22, "learning_rate": 3.942222222222222e-06, "loss": 0.3801, "step": 30500 }, { "epoch": 1.22, "learning_rate": 3.937171717171718e-06, "loss": 0.3821, "step": 30525 }, { "epoch": 1.23, "learning_rate": 3.932121212121212e-06, "loss": 0.377, "step": 30550 }, { "epoch": 1.23, "learning_rate": 3.9270707070707076e-06, "loss": 0.3815, "step": 30575 }, { "epoch": 1.23, "learning_rate": 3.922020202020203e-06, "loss": 0.3986, "step": 30600 }, { "epoch": 1.23, "learning_rate": 3.916969696969698e-06, "loss": 0.3857, "step": 30625 }, { "epoch": 1.23, "learning_rate": 3.911919191919192e-06, "loss": 0.3729, "step": 30650 }, { "epoch": 1.23, "learning_rate": 3.906868686868687e-06, "loss": 0.365, "step": 30675 }, { "epoch": 1.23, "learning_rate": 3.901818181818182e-06, "loss": 0.3761, "step": 30700 }, { "epoch": 1.23, "learning_rate": 3.896767676767677e-06, "loss": 0.3843, "step": 30725 }, { "epoch": 1.23, "learning_rate": 3.891717171717172e-06, "loss": 0.3866, "step": 30750 }, { "epoch": 1.23, "learning_rate": 3.886666666666667e-06, "loss": 0.3839, "step": 30775 }, { "epoch": 1.24, "learning_rate": 3.881616161616162e-06, "loss": 0.3657, "step": 30800 }, { "epoch": 1.24, "learning_rate": 3.8765656565656564e-06, "loss": 0.3783, "step": 30825 }, { "epoch": 1.24, "learning_rate": 3.871515151515152e-06, "loss": 0.3709, "step": 30850 }, { "epoch": 1.24, "learning_rate": 3.866666666666667e-06, "loss": 0.3716, "step": 30875 }, { "epoch": 1.24, "learning_rate": 3.8616161616161615e-06, "loss": 0.3539, "step": 30900 }, { "epoch": 1.24, "learning_rate": 3.856565656565657e-06, "loss": 0.3722, "step": 30925 }, { "epoch": 1.24, "learning_rate": 3.851515151515152e-06, "loss": 0.3756, "step": 30950 }, { "epoch": 1.24, "learning_rate": 3.846464646464647e-06, "loss": 0.3721, "step": 30975 }, { "epoch": 1.24, "learning_rate": 3.841414141414141e-06, "loss": 0.3652, "step": 31000 }, { "epoch": 1.24, "learning_rate": 3.836363636363636e-06, "loss": 0.3591, "step": 31025 }, { "epoch": 1.25, "learning_rate": 3.8313131313131315e-06, "loss": 0.3523, "step": 31050 }, { "epoch": 1.25, "learning_rate": 3.826262626262627e-06, "loss": 0.3621, "step": 31075 }, { "epoch": 1.25, "learning_rate": 3.821212121212122e-06, "loss": 0.3723, "step": 31100 }, { "epoch": 1.25, "learning_rate": 3.816161616161617e-06, "loss": 0.408, "step": 31125 }, { "epoch": 1.25, "learning_rate": 3.8111111111111117e-06, "loss": 0.3633, "step": 31150 }, { "epoch": 1.25, "learning_rate": 3.8060606060606064e-06, "loss": 0.3777, "step": 31175 }, { "epoch": 1.25, "learning_rate": 3.8010101010101015e-06, "loss": 0.3545, "step": 31200 }, { "epoch": 1.25, "learning_rate": 3.7959595959595962e-06, "loss": 0.3702, "step": 31225 }, { "epoch": 1.25, "learning_rate": 3.7909090909090914e-06, "loss": 0.3834, "step": 31250 }, { "epoch": 1.25, "learning_rate": 3.785858585858586e-06, "loss": 0.3783, "step": 31275 }, { "epoch": 1.26, "learning_rate": 3.7808080808080812e-06, "loss": 0.3867, "step": 31300 }, { "epoch": 1.26, "learning_rate": 3.775757575757576e-06, "loss": 0.3957, "step": 31325 }, { "epoch": 1.26, "learning_rate": 3.7707070707070707e-06, "loss": 0.3978, "step": 31350 }, { "epoch": 1.26, "learning_rate": 3.765656565656566e-06, "loss": 0.3811, "step": 31375 }, { "epoch": 1.26, "learning_rate": 3.7606060606060605e-06, "loss": 0.3783, "step": 31400 }, { "epoch": 1.26, "learning_rate": 3.7555555555555557e-06, "loss": 0.376, "step": 31425 }, { "epoch": 1.26, "learning_rate": 3.7505050505050504e-06, "loss": 0.4037, "step": 31450 }, { "epoch": 1.26, "learning_rate": 3.745454545454546e-06, "loss": 0.3646, "step": 31475 }, { "epoch": 1.26, "learning_rate": 3.740404040404041e-06, "loss": 0.3956, "step": 31500 }, { "epoch": 1.26, "learning_rate": 3.735353535353536e-06, "loss": 0.3631, "step": 31525 }, { "epoch": 1.27, "learning_rate": 3.7303030303030306e-06, "loss": 0.3911, "step": 31550 }, { "epoch": 1.27, "learning_rate": 3.7252525252525257e-06, "loss": 0.3575, "step": 31575 }, { "epoch": 1.27, "learning_rate": 3.7202020202020204e-06, "loss": 0.3684, "step": 31600 }, { "epoch": 1.27, "learning_rate": 3.7151515151515156e-06, "loss": 0.3883, "step": 31625 }, { "epoch": 1.27, "learning_rate": 3.7103030303030308e-06, "loss": 0.3612, "step": 31650 }, { "epoch": 1.27, "learning_rate": 3.7052525252525255e-06, "loss": 0.3719, "step": 31675 }, { "epoch": 1.27, "learning_rate": 3.7002020202020206e-06, "loss": 0.3751, "step": 31700 }, { "epoch": 1.27, "learning_rate": 3.6951515151515153e-06, "loss": 0.3733, "step": 31725 }, { "epoch": 1.27, "learning_rate": 3.6901010101010105e-06, "loss": 0.3703, "step": 31750 }, { "epoch": 1.27, "learning_rate": 3.685050505050505e-06, "loss": 0.3749, "step": 31775 }, { "epoch": 1.28, "learning_rate": 3.6800000000000003e-06, "loss": 0.3645, "step": 31800 }, { "epoch": 1.28, "learning_rate": 3.674949494949495e-06, "loss": 0.3783, "step": 31825 }, { "epoch": 1.28, "learning_rate": 3.66989898989899e-06, "loss": 0.3761, "step": 31850 }, { "epoch": 1.28, "learning_rate": 3.664848484848485e-06, "loss": 0.3799, "step": 31875 }, { "epoch": 1.28, "learning_rate": 3.65979797979798e-06, "loss": 0.3971, "step": 31900 }, { "epoch": 1.28, "learning_rate": 3.6547474747474748e-06, "loss": 0.3596, "step": 31925 }, { "epoch": 1.28, "learning_rate": 3.64969696969697e-06, "loss": 0.3811, "step": 31950 }, { "epoch": 1.28, "learning_rate": 3.644646464646465e-06, "loss": 0.3619, "step": 31975 }, { "epoch": 1.28, "learning_rate": 3.6395959595959602e-06, "loss": 0.3776, "step": 32000 }, { "epoch": 1.28, "learning_rate": 3.634545454545455e-06, "loss": 0.3886, "step": 32025 }, { "epoch": 1.29, "learning_rate": 3.62949494949495e-06, "loss": 0.3691, "step": 32050 }, { "epoch": 1.29, "learning_rate": 3.624444444444445e-06, "loss": 0.3774, "step": 32075 }, { "epoch": 1.29, "learning_rate": 3.61939393939394e-06, "loss": 0.3706, "step": 32100 }, { "epoch": 1.29, "learning_rate": 3.6143434343434347e-06, "loss": 0.3684, "step": 32125 }, { "epoch": 1.29, "learning_rate": 3.60929292929293e-06, "loss": 0.3787, "step": 32150 }, { "epoch": 1.29, "learning_rate": 3.6042424242424245e-06, "loss": 0.3814, "step": 32175 }, { "epoch": 1.29, "learning_rate": 3.5991919191919197e-06, "loss": 0.3632, "step": 32200 }, { "epoch": 1.29, "learning_rate": 3.5941414141414144e-06, "loss": 0.3616, "step": 32225 }, { "epoch": 1.29, "learning_rate": 3.589090909090909e-06, "loss": 0.3776, "step": 32250 }, { "epoch": 1.29, "learning_rate": 3.5840404040404043e-06, "loss": 0.3877, "step": 32275 }, { "epoch": 1.3, "learning_rate": 3.578989898989899e-06, "loss": 0.3801, "step": 32300 }, { "epoch": 1.3, "learning_rate": 3.573939393939394e-06, "loss": 0.38, "step": 32325 }, { "epoch": 1.3, "learning_rate": 3.568888888888889e-06, "loss": 0.3855, "step": 32350 }, { "epoch": 1.3, "learning_rate": 3.563838383838384e-06, "loss": 0.3809, "step": 32375 }, { "epoch": 1.3, "learning_rate": 3.5587878787878795e-06, "loss": 0.3729, "step": 32400 }, { "epoch": 1.3, "learning_rate": 3.5537373737373743e-06, "loss": 0.3869, "step": 32425 }, { "epoch": 1.3, "learning_rate": 3.548686868686869e-06, "loss": 0.373, "step": 32450 }, { "epoch": 1.3, "learning_rate": 3.543636363636364e-06, "loss": 0.3739, "step": 32475 }, { "epoch": 1.3, "learning_rate": 3.538585858585859e-06, "loss": 0.3774, "step": 32500 }, { "epoch": 1.3, "eval_loss": 0.39484164118766785, "eval_runtime": 316.8768, "eval_samples_per_second": 15.795, "eval_steps_per_second": 1.976, "eval_wer": 29.286409264576758, "step": 32500 }, { "epoch": 1.3, "learning_rate": 3.533535353535354e-06, "loss": 0.3763, "step": 32525 }, { "epoch": 1.31, "learning_rate": 3.5284848484848487e-06, "loss": 0.3612, "step": 32550 }, { "epoch": 1.31, "learning_rate": 3.523434343434344e-06, "loss": 0.3716, "step": 32575 }, { "epoch": 1.31, "learning_rate": 3.5183838383838386e-06, "loss": 0.3837, "step": 32600 }, { "epoch": 1.31, "learning_rate": 3.5133333333333337e-06, "loss": 0.3732, "step": 32625 }, { "epoch": 1.31, "learning_rate": 3.5082828282828284e-06, "loss": 0.3579, "step": 32650 }, { "epoch": 1.31, "learning_rate": 3.5032323232323236e-06, "loss": 0.3632, "step": 32675 }, { "epoch": 1.31, "learning_rate": 3.4981818181818183e-06, "loss": 0.3622, "step": 32700 }, { "epoch": 1.31, "learning_rate": 3.4931313131313134e-06, "loss": 0.372, "step": 32725 }, { "epoch": 1.31, "learning_rate": 3.488080808080808e-06, "loss": 0.3654, "step": 32750 }, { "epoch": 1.31, "learning_rate": 3.483030303030303e-06, "loss": 0.3585, "step": 32775 }, { "epoch": 1.32, "learning_rate": 3.477979797979798e-06, "loss": 0.3741, "step": 32800 }, { "epoch": 1.32, "learning_rate": 3.4729292929292936e-06, "loss": 0.3837, "step": 32825 }, { "epoch": 1.32, "learning_rate": 3.4678787878787883e-06, "loss": 0.3789, "step": 32850 }, { "epoch": 1.32, "learning_rate": 3.4628282828282835e-06, "loss": 0.3655, "step": 32875 }, { "epoch": 1.32, "learning_rate": 3.457777777777778e-06, "loss": 0.3971, "step": 32900 }, { "epoch": 1.32, "learning_rate": 3.4527272727272733e-06, "loss": 0.3546, "step": 32925 }, { "epoch": 1.32, "learning_rate": 3.447676767676768e-06, "loss": 0.3669, "step": 32950 }, { "epoch": 1.32, "learning_rate": 3.442626262626263e-06, "loss": 0.3724, "step": 32975 }, { "epoch": 1.32, "learning_rate": 3.437575757575758e-06, "loss": 0.3663, "step": 33000 }, { "epoch": 1.32, "learning_rate": 3.4325252525252526e-06, "loss": 0.3658, "step": 33025 }, { "epoch": 1.33, "learning_rate": 3.4274747474747478e-06, "loss": 0.3767, "step": 33050 }, { "epoch": 1.33, "learning_rate": 3.4224242424242425e-06, "loss": 0.3873, "step": 33075 }, { "epoch": 1.33, "learning_rate": 3.4173737373737376e-06, "loss": 0.3811, "step": 33100 }, { "epoch": 1.33, "learning_rate": 3.4123232323232323e-06, "loss": 0.3642, "step": 33125 }, { "epoch": 1.33, "learning_rate": 3.4072727272727275e-06, "loss": 0.3857, "step": 33150 }, { "epoch": 1.33, "learning_rate": 3.4022222222222222e-06, "loss": 0.3699, "step": 33175 }, { "epoch": 1.33, "learning_rate": 3.3971717171717174e-06, "loss": 0.3551, "step": 33200 }, { "epoch": 1.33, "learning_rate": 3.392121212121212e-06, "loss": 0.3643, "step": 33225 }, { "epoch": 1.33, "learning_rate": 3.3870707070707076e-06, "loss": 0.3619, "step": 33250 }, { "epoch": 1.33, "learning_rate": 3.3820202020202024e-06, "loss": 0.3629, "step": 33275 }, { "epoch": 1.34, "learning_rate": 3.3769696969696975e-06, "loss": 0.3771, "step": 33300 }, { "epoch": 1.34, "learning_rate": 3.3719191919191922e-06, "loss": 0.3686, "step": 33325 }, { "epoch": 1.34, "learning_rate": 3.3668686868686874e-06, "loss": 0.384, "step": 33350 }, { "epoch": 1.34, "learning_rate": 3.361818181818182e-06, "loss": 0.3782, "step": 33375 }, { "epoch": 1.34, "learning_rate": 3.3567676767676772e-06, "loss": 0.3908, "step": 33400 }, { "epoch": 1.34, "learning_rate": 3.351717171717172e-06, "loss": 0.3656, "step": 33425 }, { "epoch": 1.34, "learning_rate": 3.346666666666667e-06, "loss": 0.3744, "step": 33450 }, { "epoch": 1.34, "learning_rate": 3.341616161616162e-06, "loss": 0.3734, "step": 33475 }, { "epoch": 1.34, "learning_rate": 3.336565656565657e-06, "loss": 0.3818, "step": 33500 }, { "epoch": 1.34, "learning_rate": 3.3315151515151517e-06, "loss": 0.357, "step": 33525 }, { "epoch": 1.35, "learning_rate": 3.326464646464647e-06, "loss": 0.3672, "step": 33550 }, { "epoch": 1.35, "learning_rate": 3.3214141414141415e-06, "loss": 0.3844, "step": 33575 }, { "epoch": 1.35, "learning_rate": 3.3163636363636363e-06, "loss": 0.3595, "step": 33600 }, { "epoch": 1.35, "learning_rate": 3.3113131313131314e-06, "loss": 0.3811, "step": 33625 }, { "epoch": 1.35, "learning_rate": 3.306262626262626e-06, "loss": 0.3512, "step": 33650 }, { "epoch": 1.35, "learning_rate": 3.3012121212121217e-06, "loss": 0.379, "step": 33675 }, { "epoch": 1.35, "learning_rate": 3.296161616161617e-06, "loss": 0.3905, "step": 33700 }, { "epoch": 1.35, "learning_rate": 3.2911111111111116e-06, "loss": 0.3655, "step": 33725 }, { "epoch": 1.35, "learning_rate": 3.2860606060606067e-06, "loss": 0.3791, "step": 33750 }, { "epoch": 1.35, "learning_rate": 3.2810101010101014e-06, "loss": 0.3635, "step": 33775 }, { "epoch": 1.36, "learning_rate": 3.275959595959596e-06, "loss": 0.3685, "step": 33800 }, { "epoch": 1.36, "learning_rate": 3.2709090909090913e-06, "loss": 0.3658, "step": 33825 }, { "epoch": 1.36, "learning_rate": 3.265858585858586e-06, "loss": 0.3813, "step": 33850 }, { "epoch": 1.36, "learning_rate": 3.260808080808081e-06, "loss": 0.3697, "step": 33875 }, { "epoch": 1.36, "learning_rate": 3.255757575757576e-06, "loss": 0.3699, "step": 33900 }, { "epoch": 1.36, "learning_rate": 3.250707070707071e-06, "loss": 0.3908, "step": 33925 }, { "epoch": 1.36, "learning_rate": 3.2456565656565657e-06, "loss": 0.3789, "step": 33950 }, { "epoch": 1.36, "learning_rate": 3.240606060606061e-06, "loss": 0.3673, "step": 33975 }, { "epoch": 1.36, "learning_rate": 3.2355555555555556e-06, "loss": 0.3746, "step": 34000 }, { "epoch": 1.36, "learning_rate": 3.2305050505050507e-06, "loss": 0.3683, "step": 34025 }, { "epoch": 1.37, "learning_rate": 3.2254545454545455e-06, "loss": 0.3722, "step": 34050 }, { "epoch": 1.37, "learning_rate": 3.2204040404040406e-06, "loss": 0.3844, "step": 34075 }, { "epoch": 1.37, "learning_rate": 3.2153535353535357e-06, "loss": 0.3661, "step": 34100 }, { "epoch": 1.37, "learning_rate": 3.210303030303031e-06, "loss": 0.3803, "step": 34125 }, { "epoch": 1.37, "learning_rate": 3.2052525252525256e-06, "loss": 0.3847, "step": 34150 }, { "epoch": 1.37, "learning_rate": 3.2002020202020207e-06, "loss": 0.3853, "step": 34175 }, { "epoch": 1.37, "learning_rate": 3.1951515151515155e-06, "loss": 0.3683, "step": 34200 }, { "epoch": 1.37, "learning_rate": 3.1901010101010106e-06, "loss": 0.379, "step": 34225 }, { "epoch": 1.37, "learning_rate": 3.1850505050505053e-06, "loss": 0.3779, "step": 34250 }, { "epoch": 1.37, "learning_rate": 3.1800000000000005e-06, "loss": 0.3689, "step": 34275 }, { "epoch": 1.38, "learning_rate": 3.174949494949495e-06, "loss": 0.3779, "step": 34300 }, { "epoch": 1.38, "learning_rate": 3.1698989898989903e-06, "loss": 0.3603, "step": 34325 }, { "epoch": 1.38, "learning_rate": 3.164848484848485e-06, "loss": 0.3832, "step": 34350 }, { "epoch": 1.38, "learning_rate": 3.1597979797979798e-06, "loss": 0.3902, "step": 34375 }, { "epoch": 1.38, "learning_rate": 3.154747474747475e-06, "loss": 0.37, "step": 34400 }, { "epoch": 1.38, "learning_rate": 3.1496969696969696e-06, "loss": 0.3629, "step": 34425 }, { "epoch": 1.38, "learning_rate": 3.1446464646464648e-06, "loss": 0.3733, "step": 34450 }, { "epoch": 1.38, "learning_rate": 3.1395959595959595e-06, "loss": 0.3633, "step": 34475 }, { "epoch": 1.38, "learning_rate": 3.1345454545454546e-06, "loss": 0.3804, "step": 34500 }, { "epoch": 1.38, "learning_rate": 3.1294949494949494e-06, "loss": 0.3715, "step": 34525 }, { "epoch": 1.39, "learning_rate": 3.124444444444445e-06, "loss": 0.3571, "step": 34550 }, { "epoch": 1.39, "learning_rate": 3.11939393939394e-06, "loss": 0.3838, "step": 34575 }, { "epoch": 1.39, "learning_rate": 3.114343434343435e-06, "loss": 0.3638, "step": 34600 }, { "epoch": 1.39, "learning_rate": 3.1092929292929295e-06, "loss": 0.3643, "step": 34625 }, { "epoch": 1.39, "learning_rate": 3.1042424242424247e-06, "loss": 0.3621, "step": 34650 }, { "epoch": 1.39, "learning_rate": 3.0991919191919194e-06, "loss": 0.3687, "step": 34675 }, { "epoch": 1.39, "learning_rate": 3.0941414141414145e-06, "loss": 0.3607, "step": 34700 }, { "epoch": 1.39, "learning_rate": 3.0890909090909092e-06, "loss": 0.3902, "step": 34725 }, { "epoch": 1.39, "learning_rate": 3.0840404040404044e-06, "loss": 0.3709, "step": 34750 }, { "epoch": 1.39, "learning_rate": 3.078989898989899e-06, "loss": 0.3906, "step": 34775 }, { "epoch": 1.4, "learning_rate": 3.0739393939393942e-06, "loss": 0.3538, "step": 34800 }, { "epoch": 1.4, "learning_rate": 3.068888888888889e-06, "loss": 0.3618, "step": 34825 }, { "epoch": 1.4, "learning_rate": 3.063838383838384e-06, "loss": 0.3723, "step": 34850 }, { "epoch": 1.4, "learning_rate": 3.058787878787879e-06, "loss": 0.3607, "step": 34875 }, { "epoch": 1.4, "learning_rate": 3.053737373737374e-06, "loss": 0.363, "step": 34900 }, { "epoch": 1.4, "learning_rate": 3.0486868686868687e-06, "loss": 0.3426, "step": 34925 }, { "epoch": 1.4, "learning_rate": 3.0436363636363634e-06, "loss": 0.3637, "step": 34950 }, { "epoch": 1.4, "learning_rate": 3.038585858585859e-06, "loss": 0.3681, "step": 34975 }, { "epoch": 1.4, "learning_rate": 3.033535353535354e-06, "loss": 0.3667, "step": 35000 }, { "epoch": 1.4, "eval_loss": 0.3912336826324463, "eval_runtime": 305.76, "eval_samples_per_second": 16.369, "eval_steps_per_second": 2.047, "eval_wer": 29.516599824390706, "step": 35000 }, { "epoch": 1.4, "learning_rate": 3.028484848484849e-06, "loss": 0.371, "step": 35025 }, { "epoch": 1.41, "learning_rate": 3.023434343434344e-06, "loss": 0.3572, "step": 35050 }, { "epoch": 1.41, "learning_rate": 3.0183838383838387e-06, "loss": 0.3677, "step": 35075 }, { "epoch": 1.41, "learning_rate": 3.013333333333334e-06, "loss": 0.3687, "step": 35100 }, { "epoch": 1.41, "learning_rate": 3.0082828282828286e-06, "loss": 0.3723, "step": 35125 }, { "epoch": 1.41, "learning_rate": 3.0032323232323237e-06, "loss": 0.3641, "step": 35150 }, { "epoch": 1.41, "learning_rate": 2.9981818181818184e-06, "loss": 0.3574, "step": 35175 }, { "epoch": 1.41, "learning_rate": 2.993131313131313e-06, "loss": 0.3686, "step": 35200 }, { "epoch": 1.41, "learning_rate": 2.9880808080808083e-06, "loss": 0.3802, "step": 35225 }, { "epoch": 1.41, "learning_rate": 2.983030303030303e-06, "loss": 0.3695, "step": 35250 }, { "epoch": 1.41, "learning_rate": 2.977979797979798e-06, "loss": 0.3799, "step": 35275 }, { "epoch": 1.42, "learning_rate": 2.972929292929293e-06, "loss": 0.3693, "step": 35300 }, { "epoch": 1.42, "learning_rate": 2.967878787878788e-06, "loss": 0.3745, "step": 35325 }, { "epoch": 1.42, "learning_rate": 2.9628282828282827e-06, "loss": 0.3884, "step": 35350 }, { "epoch": 1.42, "learning_rate": 2.957777777777778e-06, "loss": 0.3866, "step": 35375 }, { "epoch": 1.42, "learning_rate": 2.952727272727273e-06, "loss": 0.3682, "step": 35400 }, { "epoch": 1.42, "learning_rate": 2.947676767676768e-06, "loss": 0.3848, "step": 35425 }, { "epoch": 1.42, "learning_rate": 2.942626262626263e-06, "loss": 0.3718, "step": 35450 }, { "epoch": 1.42, "learning_rate": 2.937575757575758e-06, "loss": 0.3725, "step": 35475 }, { "epoch": 1.42, "learning_rate": 2.9325252525252528e-06, "loss": 0.3892, "step": 35500 }, { "epoch": 1.42, "learning_rate": 2.927474747474748e-06, "loss": 0.3646, "step": 35525 }, { "epoch": 1.43, "learning_rate": 2.9224242424242426e-06, "loss": 0.3628, "step": 35550 }, { "epoch": 1.43, "learning_rate": 2.9173737373737378e-06, "loss": 0.3609, "step": 35575 }, { "epoch": 1.43, "learning_rate": 2.9123232323232325e-06, "loss": 0.3547, "step": 35600 }, { "epoch": 1.43, "learning_rate": 2.9072727272727276e-06, "loss": 0.3778, "step": 35625 }, { "epoch": 1.43, "learning_rate": 2.9022222222222223e-06, "loss": 0.3585, "step": 35650 }, { "epoch": 1.43, "learning_rate": 2.8973737373737375e-06, "loss": 0.369, "step": 35675 }, { "epoch": 1.43, "learning_rate": 2.8923232323232327e-06, "loss": 0.3617, "step": 35700 }, { "epoch": 1.43, "learning_rate": 2.8872727272727274e-06, "loss": 0.3639, "step": 35725 }, { "epoch": 1.43, "learning_rate": 2.8822222222222225e-06, "loss": 0.3638, "step": 35750 }, { "epoch": 1.43, "learning_rate": 2.8771717171717173e-06, "loss": 0.3639, "step": 35775 }, { "epoch": 1.44, "learning_rate": 2.8721212121212124e-06, "loss": 0.3808, "step": 35800 }, { "epoch": 1.44, "learning_rate": 2.867070707070707e-06, "loss": 0.375, "step": 35825 }, { "epoch": 1.44, "learning_rate": 2.862020202020202e-06, "loss": 0.3533, "step": 35850 }, { "epoch": 1.44, "learning_rate": 2.856969696969697e-06, "loss": 0.3687, "step": 35875 }, { "epoch": 1.44, "learning_rate": 2.8519191919191925e-06, "loss": 0.3734, "step": 35900 }, { "epoch": 1.44, "learning_rate": 2.8468686868686873e-06, "loss": 0.3532, "step": 35925 }, { "epoch": 1.44, "learning_rate": 2.8418181818181824e-06, "loss": 0.3764, "step": 35950 }, { "epoch": 1.44, "learning_rate": 2.836767676767677e-06, "loss": 0.3668, "step": 35975 }, { "epoch": 1.44, "learning_rate": 2.8317171717171723e-06, "loss": 0.3666, "step": 36000 }, { "epoch": 1.44, "learning_rate": 2.826666666666667e-06, "loss": 0.3726, "step": 36025 }, { "epoch": 1.45, "learning_rate": 2.8216161616161617e-06, "loss": 0.3732, "step": 36050 }, { "epoch": 1.45, "learning_rate": 2.816565656565657e-06, "loss": 0.3792, "step": 36075 }, { "epoch": 1.45, "learning_rate": 2.8115151515151516e-06, "loss": 0.3611, "step": 36100 }, { "epoch": 1.45, "learning_rate": 2.8064646464646467e-06, "loss": 0.3788, "step": 36125 }, { "epoch": 1.45, "learning_rate": 2.8014141414141414e-06, "loss": 0.3708, "step": 36150 }, { "epoch": 1.45, "learning_rate": 2.7963636363636366e-06, "loss": 0.3748, "step": 36175 }, { "epoch": 1.45, "learning_rate": 2.7913131313131313e-06, "loss": 0.3703, "step": 36200 }, { "epoch": 1.45, "learning_rate": 2.7862626262626264e-06, "loss": 0.3886, "step": 36225 }, { "epoch": 1.45, "learning_rate": 2.781212121212121e-06, "loss": 0.3808, "step": 36250 }, { "epoch": 1.45, "learning_rate": 2.7761616161616163e-06, "loss": 0.3718, "step": 36275 }, { "epoch": 1.46, "learning_rate": 2.771111111111111e-06, "loss": 0.3705, "step": 36300 }, { "epoch": 1.46, "learning_rate": 2.7660606060606066e-06, "loss": 0.3652, "step": 36325 }, { "epoch": 1.46, "learning_rate": 2.7610101010101013e-06, "loss": 0.3868, "step": 36350 }, { "epoch": 1.46, "learning_rate": 2.7559595959595965e-06, "loss": 0.3726, "step": 36375 }, { "epoch": 1.46, "learning_rate": 2.750909090909091e-06, "loss": 0.3618, "step": 36400 }, { "epoch": 1.46, "learning_rate": 2.7458585858585863e-06, "loss": 0.3691, "step": 36425 }, { "epoch": 1.46, "learning_rate": 2.740808080808081e-06, "loss": 0.3828, "step": 36450 }, { "epoch": 1.46, "learning_rate": 2.735757575757576e-06, "loss": 0.3493, "step": 36475 }, { "epoch": 1.46, "learning_rate": 2.730707070707071e-06, "loss": 0.3479, "step": 36500 }, { "epoch": 1.46, "learning_rate": 2.725656565656566e-06, "loss": 0.3757, "step": 36525 }, { "epoch": 1.47, "learning_rate": 2.7206060606060608e-06, "loss": 0.382, "step": 36550 }, { "epoch": 1.47, "learning_rate": 2.715555555555556e-06, "loss": 0.3821, "step": 36575 }, { "epoch": 1.47, "learning_rate": 2.7105050505050506e-06, "loss": 0.3745, "step": 36600 }, { "epoch": 1.47, "learning_rate": 2.7054545454545453e-06, "loss": 0.3865, "step": 36625 }, { "epoch": 1.47, "learning_rate": 2.7004040404040405e-06, "loss": 0.3973, "step": 36650 }, { "epoch": 1.47, "learning_rate": 2.695353535353535e-06, "loss": 0.3608, "step": 36675 }, { "epoch": 1.47, "learning_rate": 2.6903030303030304e-06, "loss": 0.3895, "step": 36700 }, { "epoch": 1.47, "learning_rate": 2.685252525252525e-06, "loss": 0.3636, "step": 36725 }, { "epoch": 1.47, "learning_rate": 2.6802020202020206e-06, "loss": 0.3612, "step": 36750 }, { "epoch": 1.47, "learning_rate": 2.6751515151515158e-06, "loss": 0.3774, "step": 36775 }, { "epoch": 1.48, "learning_rate": 2.6701010101010105e-06, "loss": 0.3648, "step": 36800 }, { "epoch": 1.48, "learning_rate": 2.6650505050505056e-06, "loss": 0.3923, "step": 36825 }, { "epoch": 1.48, "learning_rate": 2.6600000000000004e-06, "loss": 0.3753, "step": 36850 }, { "epoch": 1.48, "learning_rate": 2.654949494949495e-06, "loss": 0.359, "step": 36875 }, { "epoch": 1.48, "learning_rate": 2.6498989898989902e-06, "loss": 0.3599, "step": 36900 }, { "epoch": 1.48, "learning_rate": 2.644848484848485e-06, "loss": 0.3582, "step": 36925 }, { "epoch": 1.48, "learning_rate": 2.63979797979798e-06, "loss": 0.377, "step": 36950 }, { "epoch": 1.48, "learning_rate": 2.634747474747475e-06, "loss": 0.3565, "step": 36975 }, { "epoch": 1.48, "learning_rate": 2.62969696969697e-06, "loss": 0.3517, "step": 37000 }, { "epoch": 1.48, "learning_rate": 2.6246464646464647e-06, "loss": 0.3668, "step": 37025 }, { "epoch": 1.49, "learning_rate": 2.61959595959596e-06, "loss": 0.3779, "step": 37050 }, { "epoch": 1.49, "learning_rate": 2.6145454545454545e-06, "loss": 0.3635, "step": 37075 }, { "epoch": 1.49, "learning_rate": 2.6094949494949497e-06, "loss": 0.3662, "step": 37100 }, { "epoch": 1.49, "learning_rate": 2.6044444444444444e-06, "loss": 0.3695, "step": 37125 }, { "epoch": 1.49, "learning_rate": 2.5993939393939395e-06, "loss": 0.3585, "step": 37150 }, { "epoch": 1.49, "learning_rate": 2.5943434343434347e-06, "loss": 0.3716, "step": 37175 }, { "epoch": 1.49, "learning_rate": 2.58929292929293e-06, "loss": 0.3694, "step": 37200 }, { "epoch": 1.49, "learning_rate": 2.5842424242424246e-06, "loss": 0.3676, "step": 37225 }, { "epoch": 1.49, "learning_rate": 2.5791919191919197e-06, "loss": 0.3785, "step": 37250 }, { "epoch": 1.49, "learning_rate": 2.5741414141414144e-06, "loss": 0.3505, "step": 37275 }, { "epoch": 1.5, "learning_rate": 2.5690909090909096e-06, "loss": 0.3643, "step": 37300 }, { "epoch": 1.5, "learning_rate": 2.5640404040404043e-06, "loss": 0.3612, "step": 37325 }, { "epoch": 1.5, "learning_rate": 2.5589898989898994e-06, "loss": 0.3833, "step": 37350 }, { "epoch": 1.5, "learning_rate": 2.553939393939394e-06, "loss": 0.3497, "step": 37375 }, { "epoch": 1.5, "learning_rate": 2.5488888888888893e-06, "loss": 0.358, "step": 37400 }, { "epoch": 1.5, "learning_rate": 2.543838383838384e-06, "loss": 0.3683, "step": 37425 }, { "epoch": 1.5, "learning_rate": 2.5387878787878787e-06, "loss": 0.3678, "step": 37450 }, { "epoch": 1.5, "learning_rate": 2.533737373737374e-06, "loss": 0.367, "step": 37475 }, { "epoch": 1.5, "learning_rate": 2.5286868686868686e-06, "loss": 0.3674, "step": 37500 }, { "epoch": 1.5, "eval_loss": 0.3881114423274994, "eval_runtime": 315.0434, "eval_samples_per_second": 15.887, "eval_steps_per_second": 1.987, "eval_wer": 29.611523766582025, "step": 37500 }, { "epoch": 1.5, "learning_rate": 2.5236363636363637e-06, "loss": 0.3705, "step": 37525 }, { "epoch": 1.51, "learning_rate": 2.5185858585858584e-06, "loss": 0.3774, "step": 37550 }, { "epoch": 1.51, "learning_rate": 2.5135353535353536e-06, "loss": 0.3828, "step": 37575 }, { "epoch": 1.51, "learning_rate": 2.508484848484849e-06, "loss": 0.3841, "step": 37600 }, { "epoch": 1.51, "learning_rate": 2.503434343434344e-06, "loss": 0.365, "step": 37625 }, { "epoch": 1.51, "learning_rate": 2.4983838383838386e-06, "loss": 0.3662, "step": 37650 }, { "epoch": 1.51, "learning_rate": 2.4935353535353538e-06, "loss": 0.3612, "step": 37675 }, { "epoch": 1.51, "learning_rate": 2.4884848484848485e-06, "loss": 0.3737, "step": 37700 }, { "epoch": 1.51, "learning_rate": 2.4834343434343436e-06, "loss": 0.3698, "step": 37725 }, { "epoch": 1.51, "learning_rate": 2.4783838383838384e-06, "loss": 0.3605, "step": 37750 }, { "epoch": 1.51, "learning_rate": 2.4733333333333335e-06, "loss": 0.3811, "step": 37775 }, { "epoch": 1.52, "learning_rate": 2.4682828282828287e-06, "loss": 0.3475, "step": 37800 }, { "epoch": 1.52, "learning_rate": 2.4632323232323234e-06, "loss": 0.384, "step": 37825 }, { "epoch": 1.52, "learning_rate": 2.4581818181818185e-06, "loss": 0.3673, "step": 37850 }, { "epoch": 1.52, "learning_rate": 2.4531313131313132e-06, "loss": 0.3607, "step": 37875 }, { "epoch": 1.52, "learning_rate": 2.4480808080808084e-06, "loss": 0.3692, "step": 37900 }, { "epoch": 1.52, "learning_rate": 2.443030303030303e-06, "loss": 0.3598, "step": 37925 }, { "epoch": 1.52, "learning_rate": 2.4379797979797982e-06, "loss": 0.375, "step": 37950 }, { "epoch": 1.52, "learning_rate": 2.432929292929293e-06, "loss": 0.3648, "step": 37975 }, { "epoch": 1.52, "learning_rate": 2.427878787878788e-06, "loss": 0.371, "step": 38000 }, { "epoch": 1.52, "learning_rate": 2.4228282828282832e-06, "loss": 0.3652, "step": 38025 }, { "epoch": 1.53, "learning_rate": 2.417777777777778e-06, "loss": 0.366, "step": 38050 }, { "epoch": 1.53, "learning_rate": 2.412727272727273e-06, "loss": 0.3743, "step": 38075 }, { "epoch": 1.53, "learning_rate": 2.407676767676768e-06, "loss": 0.3759, "step": 38100 }, { "epoch": 1.53, "learning_rate": 2.402626262626263e-06, "loss": 0.3602, "step": 38125 }, { "epoch": 1.53, "learning_rate": 2.3975757575757577e-06, "loss": 0.3499, "step": 38150 }, { "epoch": 1.53, "learning_rate": 2.392525252525253e-06, "loss": 0.379, "step": 38175 }, { "epoch": 1.53, "learning_rate": 2.3874747474747476e-06, "loss": 0.3714, "step": 38200 }, { "epoch": 1.53, "learning_rate": 2.3824242424242427e-06, "loss": 0.3651, "step": 38225 }, { "epoch": 1.53, "learning_rate": 2.377373737373738e-06, "loss": 0.3924, "step": 38250 }, { "epoch": 1.53, "learning_rate": 2.3723232323232326e-06, "loss": 0.3603, "step": 38275 }, { "epoch": 1.54, "learning_rate": 2.3672727272727277e-06, "loss": 0.3641, "step": 38300 }, { "epoch": 1.54, "learning_rate": 2.3622222222222224e-06, "loss": 0.3601, "step": 38325 }, { "epoch": 1.54, "learning_rate": 2.357171717171717e-06, "loss": 0.3579, "step": 38350 }, { "epoch": 1.54, "learning_rate": 2.3521212121212123e-06, "loss": 0.3695, "step": 38375 }, { "epoch": 1.54, "learning_rate": 2.347070707070707e-06, "loss": 0.3897, "step": 38400 }, { "epoch": 1.54, "learning_rate": 2.342020202020202e-06, "loss": 0.3636, "step": 38425 }, { "epoch": 1.54, "learning_rate": 2.3369696969696973e-06, "loss": 0.3608, "step": 38450 }, { "epoch": 1.54, "learning_rate": 2.331919191919192e-06, "loss": 0.3822, "step": 38475 }, { "epoch": 1.54, "learning_rate": 2.326868686868687e-06, "loss": 0.3553, "step": 38500 }, { "epoch": 1.54, "learning_rate": 2.321818181818182e-06, "loss": 0.3531, "step": 38525 }, { "epoch": 1.55, "learning_rate": 2.316767676767677e-06, "loss": 0.3777, "step": 38550 }, { "epoch": 1.55, "learning_rate": 2.3117171717171717e-06, "loss": 0.3587, "step": 38575 }, { "epoch": 1.55, "learning_rate": 2.306666666666667e-06, "loss": 0.351, "step": 38600 }, { "epoch": 1.55, "learning_rate": 2.3016161616161616e-06, "loss": 0.3717, "step": 38625 }, { "epoch": 1.55, "learning_rate": 2.2965656565656568e-06, "loss": 0.3726, "step": 38650 }, { "epoch": 1.55, "learning_rate": 2.291515151515152e-06, "loss": 0.3658, "step": 38675 }, { "epoch": 1.55, "learning_rate": 2.2864646464646466e-06, "loss": 0.3675, "step": 38700 }, { "epoch": 1.55, "learning_rate": 2.2814141414141418e-06, "loss": 0.3596, "step": 38725 }, { "epoch": 1.55, "learning_rate": 2.2763636363636365e-06, "loss": 0.3791, "step": 38750 }, { "epoch": 1.55, "learning_rate": 2.2713131313131316e-06, "loss": 0.3683, "step": 38775 }, { "epoch": 1.56, "learning_rate": 2.2662626262626263e-06, "loss": 0.3827, "step": 38800 }, { "epoch": 1.56, "learning_rate": 2.2612121212121215e-06, "loss": 0.3748, "step": 38825 }, { "epoch": 1.56, "learning_rate": 2.256161616161616e-06, "loss": 0.371, "step": 38850 }, { "epoch": 1.56, "learning_rate": 2.2511111111111113e-06, "loss": 0.3624, "step": 38875 }, { "epoch": 1.56, "learning_rate": 2.2460606060606065e-06, "loss": 0.3662, "step": 38900 }, { "epoch": 1.56, "learning_rate": 2.241010101010101e-06, "loss": 0.3618, "step": 38925 }, { "epoch": 1.56, "learning_rate": 2.2359595959595964e-06, "loss": 0.366, "step": 38950 }, { "epoch": 1.56, "learning_rate": 2.230909090909091e-06, "loss": 0.3647, "step": 38975 }, { "epoch": 1.56, "learning_rate": 2.225858585858586e-06, "loss": 0.3719, "step": 39000 }, { "epoch": 1.56, "learning_rate": 2.220808080808081e-06, "loss": 0.3861, "step": 39025 }, { "epoch": 1.57, "learning_rate": 2.2157575757575757e-06, "loss": 0.374, "step": 39050 }, { "epoch": 1.57, "learning_rate": 2.2107070707070712e-06, "loss": 0.3668, "step": 39075 }, { "epoch": 1.57, "learning_rate": 2.205656565656566e-06, "loss": 0.3666, "step": 39100 }, { "epoch": 1.57, "learning_rate": 2.2006060606060607e-06, "loss": 0.3709, "step": 39125 }, { "epoch": 1.57, "learning_rate": 2.195555555555556e-06, "loss": 0.3439, "step": 39150 }, { "epoch": 1.57, "learning_rate": 2.1905050505050505e-06, "loss": 0.3771, "step": 39175 }, { "epoch": 1.57, "learning_rate": 2.1854545454545457e-06, "loss": 0.3647, "step": 39200 }, { "epoch": 1.57, "learning_rate": 2.1804040404040404e-06, "loss": 0.3765, "step": 39225 }, { "epoch": 1.57, "learning_rate": 2.1753535353535355e-06, "loss": 0.3626, "step": 39250 }, { "epoch": 1.57, "learning_rate": 2.1703030303030303e-06, "loss": 0.3637, "step": 39275 }, { "epoch": 1.58, "learning_rate": 2.1652525252525254e-06, "loss": 0.351, "step": 39300 }, { "epoch": 1.58, "learning_rate": 2.1602020202020205e-06, "loss": 0.3615, "step": 39325 }, { "epoch": 1.58, "learning_rate": 2.1551515151515153e-06, "loss": 0.361, "step": 39350 }, { "epoch": 1.58, "learning_rate": 2.1501010101010104e-06, "loss": 0.349, "step": 39375 }, { "epoch": 1.58, "learning_rate": 2.145050505050505e-06, "loss": 0.3675, "step": 39400 }, { "epoch": 1.58, "learning_rate": 2.1400000000000003e-06, "loss": 0.3569, "step": 39425 }, { "epoch": 1.58, "learning_rate": 2.134949494949495e-06, "loss": 0.347, "step": 39450 }, { "epoch": 1.58, "learning_rate": 2.12989898989899e-06, "loss": 0.3669, "step": 39475 }, { "epoch": 1.58, "learning_rate": 2.1248484848484853e-06, "loss": 0.3688, "step": 39500 }, { "epoch": 1.58, "learning_rate": 2.11979797979798e-06, "loss": 0.3631, "step": 39525 }, { "epoch": 1.59, "learning_rate": 2.114747474747475e-06, "loss": 0.3549, "step": 39550 }, { "epoch": 1.59, "learning_rate": 2.10969696969697e-06, "loss": 0.3504, "step": 39575 }, { "epoch": 1.59, "learning_rate": 2.104646464646465e-06, "loss": 0.3579, "step": 39600 }, { "epoch": 1.59, "learning_rate": 2.0995959595959597e-06, "loss": 0.3856, "step": 39625 }, { "epoch": 1.59, "learning_rate": 2.094545454545455e-06, "loss": 0.3729, "step": 39650 }, { "epoch": 1.59, "learning_rate": 2.0894949494949496e-06, "loss": 0.3809, "step": 39675 }, { "epoch": 1.59, "learning_rate": 2.0846464646464648e-06, "loss": 0.3682, "step": 39700 }, { "epoch": 1.59, "learning_rate": 2.07959595959596e-06, "loss": 0.3707, "step": 39725 }, { "epoch": 1.59, "learning_rate": 2.0745454545454546e-06, "loss": 0.35, "step": 39750 }, { "epoch": 1.59, "learning_rate": 2.0694949494949493e-06, "loss": 0.3763, "step": 39775 }, { "epoch": 1.6, "learning_rate": 2.064444444444445e-06, "loss": 0.3857, "step": 39800 }, { "epoch": 1.6, "learning_rate": 2.0593939393939396e-06, "loss": 0.3519, "step": 39825 }, { "epoch": 1.6, "learning_rate": 2.0543434343434348e-06, "loss": 0.3685, "step": 39850 }, { "epoch": 1.6, "learning_rate": 2.0492929292929295e-06, "loss": 0.3894, "step": 39875 }, { "epoch": 1.6, "learning_rate": 2.0442424242424242e-06, "loss": 0.3639, "step": 39900 }, { "epoch": 1.6, "learning_rate": 2.0391919191919194e-06, "loss": 0.3852, "step": 39925 }, { "epoch": 1.6, "learning_rate": 2.034141414141414e-06, "loss": 0.3704, "step": 39950 }, { "epoch": 1.6, "learning_rate": 2.0290909090909092e-06, "loss": 0.3497, "step": 39975 }, { "epoch": 1.6, "learning_rate": 2.024040404040404e-06, "loss": 0.3721, "step": 40000 }, { "epoch": 1.6, "eval_loss": 0.38509780168533325, "eval_runtime": 317.4006, "eval_samples_per_second": 15.769, "eval_steps_per_second": 1.972, "eval_wer": 30.406511782434325, "step": 40000 }, { "epoch": 1.6, "learning_rate": 2.018989898989899e-06, "loss": 0.3682, "step": 40025 }, { "epoch": 1.61, "learning_rate": 2.0139393939393942e-06, "loss": 0.3679, "step": 40050 }, { "epoch": 1.61, "learning_rate": 2.008888888888889e-06, "loss": 0.3719, "step": 40075 }, { "epoch": 1.61, "learning_rate": 2.003838383838384e-06, "loss": 0.3647, "step": 40100 }, { "epoch": 1.61, "learning_rate": 1.998787878787879e-06, "loss": 0.3515, "step": 40125 }, { "epoch": 1.61, "learning_rate": 1.993737373737374e-06, "loss": 0.3651, "step": 40150 }, { "epoch": 1.61, "learning_rate": 1.9886868686868687e-06, "loss": 0.3716, "step": 40175 }, { "epoch": 1.61, "learning_rate": 1.983636363636364e-06, "loss": 0.3559, "step": 40200 }, { "epoch": 1.61, "learning_rate": 1.9785858585858585e-06, "loss": 0.3673, "step": 40225 }, { "epoch": 1.61, "learning_rate": 1.9735353535353537e-06, "loss": 0.3724, "step": 40250 }, { "epoch": 1.62, "learning_rate": 1.968484848484849e-06, "loss": 0.3587, "step": 40275 }, { "epoch": 1.62, "learning_rate": 1.9634343434343435e-06, "loss": 0.3762, "step": 40300 }, { "epoch": 1.62, "learning_rate": 1.9583838383838387e-06, "loss": 0.3616, "step": 40325 }, { "epoch": 1.62, "learning_rate": 1.9533333333333334e-06, "loss": 0.3605, "step": 40350 }, { "epoch": 1.62, "learning_rate": 1.9482828282828286e-06, "loss": 0.3805, "step": 40375 }, { "epoch": 1.62, "learning_rate": 1.9432323232323233e-06, "loss": 0.3777, "step": 40400 }, { "epoch": 1.62, "learning_rate": 1.9381818181818184e-06, "loss": 0.3648, "step": 40425 }, { "epoch": 1.62, "learning_rate": 1.9331313131313136e-06, "loss": 0.3803, "step": 40450 }, { "epoch": 1.62, "learning_rate": 1.9280808080808083e-06, "loss": 0.3942, "step": 40475 }, { "epoch": 1.62, "learning_rate": 1.9230303030303034e-06, "loss": 0.3739, "step": 40500 }, { "epoch": 1.63, "learning_rate": 1.917979797979798e-06, "loss": 0.3552, "step": 40525 }, { "epoch": 1.63, "learning_rate": 1.9129292929292933e-06, "loss": 0.367, "step": 40550 }, { "epoch": 1.63, "learning_rate": 1.907878787878788e-06, "loss": 0.3621, "step": 40575 }, { "epoch": 1.63, "learning_rate": 1.902828282828283e-06, "loss": 0.3791, "step": 40600 }, { "epoch": 1.63, "learning_rate": 1.8977777777777779e-06, "loss": 0.3655, "step": 40625 }, { "epoch": 1.63, "learning_rate": 1.8927272727272728e-06, "loss": 0.3467, "step": 40650 }, { "epoch": 1.63, "learning_rate": 1.887676767676768e-06, "loss": 0.3754, "step": 40675 }, { "epoch": 1.63, "learning_rate": 1.8826262626262629e-06, "loss": 0.3749, "step": 40700 }, { "epoch": 1.63, "learning_rate": 1.8775757575757578e-06, "loss": 0.3766, "step": 40725 }, { "epoch": 1.63, "learning_rate": 1.8725252525252527e-06, "loss": 0.3737, "step": 40750 }, { "epoch": 1.64, "learning_rate": 1.8674747474747477e-06, "loss": 0.3661, "step": 40775 }, { "epoch": 1.64, "learning_rate": 1.8624242424242426e-06, "loss": 0.396, "step": 40800 }, { "epoch": 1.64, "learning_rate": 1.8573737373737375e-06, "loss": 0.3857, "step": 40825 }, { "epoch": 1.64, "learning_rate": 1.8523232323232325e-06, "loss": 0.3655, "step": 40850 }, { "epoch": 1.64, "learning_rate": 1.8472727272727276e-06, "loss": 0.3718, "step": 40875 }, { "epoch": 1.64, "learning_rate": 1.8422222222222225e-06, "loss": 0.3662, "step": 40900 }, { "epoch": 1.64, "learning_rate": 1.8371717171717175e-06, "loss": 0.3759, "step": 40925 }, { "epoch": 1.64, "learning_rate": 1.8321212121212124e-06, "loss": 0.3694, "step": 40950 }, { "epoch": 1.64, "learning_rate": 1.8270707070707071e-06, "loss": 0.3765, "step": 40975 }, { "epoch": 1.64, "learning_rate": 1.822020202020202e-06, "loss": 0.3684, "step": 41000 }, { "epoch": 1.65, "learning_rate": 1.816969696969697e-06, "loss": 0.3709, "step": 41025 }, { "epoch": 1.65, "learning_rate": 1.811919191919192e-06, "loss": 0.3516, "step": 41050 }, { "epoch": 1.65, "learning_rate": 1.8068686868686868e-06, "loss": 0.3558, "step": 41075 }, { "epoch": 1.65, "learning_rate": 1.801818181818182e-06, "loss": 0.3525, "step": 41100 }, { "epoch": 1.65, "learning_rate": 1.796767676767677e-06, "loss": 0.3709, "step": 41125 }, { "epoch": 1.65, "learning_rate": 1.7917171717171719e-06, "loss": 0.3559, "step": 41150 }, { "epoch": 1.65, "learning_rate": 1.7866666666666668e-06, "loss": 0.3896, "step": 41175 }, { "epoch": 1.65, "learning_rate": 1.7816161616161617e-06, "loss": 0.3619, "step": 41200 }, { "epoch": 1.65, "learning_rate": 1.7765656565656566e-06, "loss": 0.3749, "step": 41225 }, { "epoch": 1.65, "learning_rate": 1.7715151515151516e-06, "loss": 0.3763, "step": 41250 }, { "epoch": 1.66, "learning_rate": 1.7664646464646465e-06, "loss": 0.3526, "step": 41275 }, { "epoch": 1.66, "learning_rate": 1.7614141414141417e-06, "loss": 0.366, "step": 41300 }, { "epoch": 1.66, "learning_rate": 1.7563636363636366e-06, "loss": 0.367, "step": 41325 }, { "epoch": 1.66, "learning_rate": 1.7513131313131315e-06, "loss": 0.3867, "step": 41350 }, { "epoch": 1.66, "learning_rate": 1.7462626262626264e-06, "loss": 0.3798, "step": 41375 }, { "epoch": 1.66, "learning_rate": 1.7412121212121214e-06, "loss": 0.36, "step": 41400 }, { "epoch": 1.66, "learning_rate": 1.7361616161616163e-06, "loss": 0.3643, "step": 41425 }, { "epoch": 1.66, "learning_rate": 1.7311111111111112e-06, "loss": 0.3475, "step": 41450 }, { "epoch": 1.66, "learning_rate": 1.7260606060606062e-06, "loss": 0.3631, "step": 41475 }, { "epoch": 1.66, "learning_rate": 1.721010101010101e-06, "loss": 0.3672, "step": 41500 }, { "epoch": 1.67, "learning_rate": 1.7159595959595962e-06, "loss": 0.368, "step": 41525 }, { "epoch": 1.67, "learning_rate": 1.7109090909090912e-06, "loss": 0.3634, "step": 41550 }, { "epoch": 1.67, "learning_rate": 1.7058585858585861e-06, "loss": 0.3569, "step": 41575 }, { "epoch": 1.67, "learning_rate": 1.700808080808081e-06, "loss": 0.3395, "step": 41600 }, { "epoch": 1.67, "learning_rate": 1.695757575757576e-06, "loss": 0.3582, "step": 41625 }, { "epoch": 1.67, "learning_rate": 1.6907070707070707e-06, "loss": 0.3674, "step": 41650 }, { "epoch": 1.67, "learning_rate": 1.6856565656565656e-06, "loss": 0.377, "step": 41675 }, { "epoch": 1.67, "learning_rate": 1.680808080808081e-06, "loss": 0.3689, "step": 41700 }, { "epoch": 1.67, "learning_rate": 1.675757575757576e-06, "loss": 0.3744, "step": 41725 }, { "epoch": 1.67, "learning_rate": 1.6707070707070707e-06, "loss": 0.3565, "step": 41750 }, { "epoch": 1.68, "learning_rate": 1.6656565656565656e-06, "loss": 0.3623, "step": 41775 }, { "epoch": 1.68, "learning_rate": 1.6606060606060605e-06, "loss": 0.3758, "step": 41800 }, { "epoch": 1.68, "learning_rate": 1.6555555555555559e-06, "loss": 0.3699, "step": 41825 }, { "epoch": 1.68, "learning_rate": 1.6505050505050508e-06, "loss": 0.3665, "step": 41850 }, { "epoch": 1.68, "learning_rate": 1.6454545454545455e-06, "loss": 0.3513, "step": 41875 }, { "epoch": 1.68, "learning_rate": 1.6404040404040405e-06, "loss": 0.3731, "step": 41900 }, { "epoch": 1.68, "learning_rate": 1.6353535353535354e-06, "loss": 0.3793, "step": 41925 }, { "epoch": 1.68, "learning_rate": 1.6303030303030303e-06, "loss": 0.3615, "step": 41950 }, { "epoch": 1.68, "learning_rate": 1.6252525252525253e-06, "loss": 0.3517, "step": 41975 }, { "epoch": 1.68, "learning_rate": 1.6202020202020202e-06, "loss": 0.3619, "step": 42000 }, { "epoch": 1.69, "learning_rate": 1.6151515151515153e-06, "loss": 0.3916, "step": 42025 }, { "epoch": 1.69, "learning_rate": 1.6101010101010103e-06, "loss": 0.3582, "step": 42050 }, { "epoch": 1.69, "learning_rate": 1.6050505050505052e-06, "loss": 0.3558, "step": 42075 }, { "epoch": 1.69, "learning_rate": 1.6000000000000001e-06, "loss": 0.3679, "step": 42100 }, { "epoch": 1.69, "learning_rate": 1.594949494949495e-06, "loss": 0.3584, "step": 42125 }, { "epoch": 1.69, "learning_rate": 1.58989898989899e-06, "loss": 0.3667, "step": 42150 }, { "epoch": 1.69, "learning_rate": 1.584848484848485e-06, "loss": 0.3477, "step": 42175 }, { "epoch": 1.69, "learning_rate": 1.5797979797979799e-06, "loss": 0.3554, "step": 42200 }, { "epoch": 1.69, "learning_rate": 1.5747474747474748e-06, "loss": 0.3663, "step": 42225 }, { "epoch": 1.69, "learning_rate": 1.56969696969697e-06, "loss": 0.3485, "step": 42250 }, { "epoch": 1.7, "learning_rate": 1.5646464646464649e-06, "loss": 0.3515, "step": 42275 }, { "epoch": 1.7, "learning_rate": 1.5595959595959598e-06, "loss": 0.3592, "step": 42300 }, { "epoch": 1.7, "learning_rate": 1.5545454545454547e-06, "loss": 0.3737, "step": 42325 }, { "epoch": 1.7, "learning_rate": 1.5494949494949497e-06, "loss": 0.3788, "step": 42350 }, { "epoch": 1.7, "learning_rate": 1.5444444444444446e-06, "loss": 0.3592, "step": 42375 }, { "epoch": 1.7, "learning_rate": 1.5393939393939395e-06, "loss": 0.342, "step": 42400 }, { "epoch": 1.7, "learning_rate": 1.5343434343434345e-06, "loss": 0.3619, "step": 42425 }, { "epoch": 1.7, "learning_rate": 1.5292929292929296e-06, "loss": 0.3524, "step": 42450 }, { "epoch": 1.7, "learning_rate": 1.5242424242424245e-06, "loss": 0.3443, "step": 42475 }, { "epoch": 1.7, "learning_rate": 1.5191919191919195e-06, "loss": 0.3533, "step": 42500 }, { "epoch": 1.7, "eval_loss": 0.3833695948123932, "eval_runtime": 310.9704, "eval_samples_per_second": 16.095, "eval_steps_per_second": 2.013, "eval_wer": 27.969339566672204, "step": 42500 }, { "epoch": 1.71, "learning_rate": 1.5141414141414144e-06, "loss": 0.3873, "step": 42525 }, { "epoch": 1.71, "learning_rate": 1.5090909090909091e-06, "loss": 0.3634, "step": 42550 }, { "epoch": 1.71, "learning_rate": 1.504040404040404e-06, "loss": 0.3539, "step": 42575 }, { "epoch": 1.71, "learning_rate": 1.498989898989899e-06, "loss": 0.3574, "step": 42600 }, { "epoch": 1.71, "learning_rate": 1.493939393939394e-06, "loss": 0.3717, "step": 42625 }, { "epoch": 1.71, "learning_rate": 1.4888888888888888e-06, "loss": 0.3548, "step": 42650 }, { "epoch": 1.71, "learning_rate": 1.483838383838384e-06, "loss": 0.3441, "step": 42675 }, { "epoch": 1.71, "learning_rate": 1.478787878787879e-06, "loss": 0.3601, "step": 42700 }, { "epoch": 1.71, "learning_rate": 1.4737373737373739e-06, "loss": 0.3734, "step": 42725 }, { "epoch": 1.71, "learning_rate": 1.4686868686868688e-06, "loss": 0.3636, "step": 42750 }, { "epoch": 1.72, "learning_rate": 1.4636363636363637e-06, "loss": 0.366, "step": 42775 }, { "epoch": 1.72, "learning_rate": 1.4585858585858586e-06, "loss": 0.3627, "step": 42800 }, { "epoch": 1.72, "learning_rate": 1.4535353535353536e-06, "loss": 0.3757, "step": 42825 }, { "epoch": 1.72, "learning_rate": 1.4484848484848485e-06, "loss": 0.3681, "step": 42850 }, { "epoch": 1.72, "learning_rate": 1.4434343434343437e-06, "loss": 0.3629, "step": 42875 }, { "epoch": 1.72, "learning_rate": 1.4383838383838386e-06, "loss": 0.3865, "step": 42900 }, { "epoch": 1.72, "learning_rate": 1.4333333333333335e-06, "loss": 0.3495, "step": 42925 }, { "epoch": 1.72, "learning_rate": 1.4282828282828284e-06, "loss": 0.3639, "step": 42950 }, { "epoch": 1.72, "learning_rate": 1.4232323232323234e-06, "loss": 0.3836, "step": 42975 }, { "epoch": 1.72, "learning_rate": 1.4181818181818183e-06, "loss": 0.339, "step": 43000 }, { "epoch": 1.73, "learning_rate": 1.4131313131313132e-06, "loss": 0.3689, "step": 43025 }, { "epoch": 1.73, "learning_rate": 1.4080808080808082e-06, "loss": 0.3676, "step": 43050 }, { "epoch": 1.73, "learning_rate": 1.403030303030303e-06, "loss": 0.3709, "step": 43075 }, { "epoch": 1.73, "learning_rate": 1.3979797979797982e-06, "loss": 0.3642, "step": 43100 }, { "epoch": 1.73, "learning_rate": 1.3929292929292932e-06, "loss": 0.3747, "step": 43125 }, { "epoch": 1.73, "learning_rate": 1.3878787878787881e-06, "loss": 0.377, "step": 43150 }, { "epoch": 1.73, "learning_rate": 1.382828282828283e-06, "loss": 0.3567, "step": 43175 }, { "epoch": 1.73, "learning_rate": 1.377777777777778e-06, "loss": 0.3613, "step": 43200 }, { "epoch": 1.73, "learning_rate": 1.3727272727272727e-06, "loss": 0.3624, "step": 43225 }, { "epoch": 1.73, "learning_rate": 1.3676767676767676e-06, "loss": 0.3782, "step": 43250 }, { "epoch": 1.74, "learning_rate": 1.3626262626262626e-06, "loss": 0.3644, "step": 43275 }, { "epoch": 1.74, "learning_rate": 1.357575757575758e-06, "loss": 0.3648, "step": 43300 }, { "epoch": 1.74, "learning_rate": 1.3525252525252528e-06, "loss": 0.3521, "step": 43325 }, { "epoch": 1.74, "learning_rate": 1.3474747474747476e-06, "loss": 0.3833, "step": 43350 }, { "epoch": 1.74, "learning_rate": 1.3424242424242425e-06, "loss": 0.3597, "step": 43375 }, { "epoch": 1.74, "learning_rate": 1.3373737373737374e-06, "loss": 0.3648, "step": 43400 }, { "epoch": 1.74, "learning_rate": 1.3323232323232324e-06, "loss": 0.3674, "step": 43425 }, { "epoch": 1.74, "learning_rate": 1.3272727272727273e-06, "loss": 0.3361, "step": 43450 }, { "epoch": 1.74, "learning_rate": 1.3222222222222222e-06, "loss": 0.36, "step": 43475 }, { "epoch": 1.74, "learning_rate": 1.3171717171717172e-06, "loss": 0.3592, "step": 43500 }, { "epoch": 1.75, "learning_rate": 1.3121212121212123e-06, "loss": 0.3741, "step": 43525 }, { "epoch": 1.75, "learning_rate": 1.3070707070707072e-06, "loss": 0.36, "step": 43550 }, { "epoch": 1.75, "learning_rate": 1.3020202020202022e-06, "loss": 0.3622, "step": 43575 }, { "epoch": 1.75, "learning_rate": 1.296969696969697e-06, "loss": 0.3577, "step": 43600 }, { "epoch": 1.75, "learning_rate": 1.291919191919192e-06, "loss": 0.3591, "step": 43625 }, { "epoch": 1.75, "learning_rate": 1.286868686868687e-06, "loss": 0.3711, "step": 43650 }, { "epoch": 1.75, "learning_rate": 1.2818181818181819e-06, "loss": 0.3559, "step": 43675 }, { "epoch": 1.75, "learning_rate": 1.276969696969697e-06, "loss": 0.3399, "step": 43700 }, { "epoch": 1.75, "learning_rate": 1.271919191919192e-06, "loss": 0.3564, "step": 43725 }, { "epoch": 1.75, "learning_rate": 1.266868686868687e-06, "loss": 0.3511, "step": 43750 }, { "epoch": 1.76, "learning_rate": 1.2618181818181819e-06, "loss": 0.3581, "step": 43775 }, { "epoch": 1.76, "learning_rate": 1.2567676767676768e-06, "loss": 0.3699, "step": 43800 }, { "epoch": 1.76, "learning_rate": 1.251717171717172e-06, "loss": 0.3608, "step": 43825 }, { "epoch": 1.76, "learning_rate": 1.2466666666666667e-06, "loss": 0.4034, "step": 43850 }, { "epoch": 1.76, "learning_rate": 1.2416161616161618e-06, "loss": 0.3626, "step": 43875 }, { "epoch": 1.76, "learning_rate": 1.2365656565656567e-06, "loss": 0.3781, "step": 43900 }, { "epoch": 1.76, "learning_rate": 1.2315151515151517e-06, "loss": 0.3429, "step": 43925 }, { "epoch": 1.76, "learning_rate": 1.2264646464646466e-06, "loss": 0.3661, "step": 43950 }, { "epoch": 1.76, "learning_rate": 1.2214141414141415e-06, "loss": 0.3534, "step": 43975 }, { "epoch": 1.76, "learning_rate": 1.2163636363636365e-06, "loss": 0.3589, "step": 44000 }, { "epoch": 1.77, "learning_rate": 1.2113131313131314e-06, "loss": 0.3432, "step": 44025 }, { "epoch": 1.77, "learning_rate": 1.2062626262626263e-06, "loss": 0.3779, "step": 44050 }, { "epoch": 1.77, "learning_rate": 1.2012121212121213e-06, "loss": 0.3539, "step": 44075 }, { "epoch": 1.77, "learning_rate": 1.1961616161616164e-06, "loss": 0.3715, "step": 44100 }, { "epoch": 1.77, "learning_rate": 1.1911111111111111e-06, "loss": 0.3593, "step": 44125 }, { "epoch": 1.77, "learning_rate": 1.186060606060606e-06, "loss": 0.375, "step": 44150 }, { "epoch": 1.77, "learning_rate": 1.181010101010101e-06, "loss": 0.3881, "step": 44175 }, { "epoch": 1.77, "learning_rate": 1.1759595959595961e-06, "loss": 0.3624, "step": 44200 }, { "epoch": 1.77, "learning_rate": 1.170909090909091e-06, "loss": 0.3858, "step": 44225 }, { "epoch": 1.77, "learning_rate": 1.165858585858586e-06, "loss": 0.3705, "step": 44250 }, { "epoch": 1.78, "learning_rate": 1.160808080808081e-06, "loss": 0.3474, "step": 44275 }, { "epoch": 1.78, "learning_rate": 1.1557575757575759e-06, "loss": 0.3674, "step": 44300 }, { "epoch": 1.78, "learning_rate": 1.1507070707070708e-06, "loss": 0.3706, "step": 44325 }, { "epoch": 1.78, "learning_rate": 1.1456565656565657e-06, "loss": 0.3674, "step": 44350 }, { "epoch": 1.78, "learning_rate": 1.1406060606060606e-06, "loss": 0.367, "step": 44375 }, { "epoch": 1.78, "learning_rate": 1.1355555555555558e-06, "loss": 0.3647, "step": 44400 }, { "epoch": 1.78, "learning_rate": 1.1305050505050507e-06, "loss": 0.3667, "step": 44425 }, { "epoch": 1.78, "learning_rate": 1.1254545454545457e-06, "loss": 0.3557, "step": 44450 }, { "epoch": 1.78, "learning_rate": 1.1204040404040404e-06, "loss": 0.3523, "step": 44475 }, { "epoch": 1.78, "learning_rate": 1.1153535353535353e-06, "loss": 0.3559, "step": 44500 }, { "epoch": 1.79, "learning_rate": 1.1103030303030304e-06, "loss": 0.3484, "step": 44525 }, { "epoch": 1.79, "learning_rate": 1.1052525252525254e-06, "loss": 0.372, "step": 44550 }, { "epoch": 1.79, "learning_rate": 1.1002020202020203e-06, "loss": 0.3515, "step": 44575 }, { "epoch": 1.79, "learning_rate": 1.0951515151515152e-06, "loss": 0.3759, "step": 44600 }, { "epoch": 1.79, "learning_rate": 1.0901010101010102e-06, "loss": 0.3682, "step": 44625 }, { "epoch": 1.79, "learning_rate": 1.085050505050505e-06, "loss": 0.362, "step": 44650 }, { "epoch": 1.79, "learning_rate": 1.08e-06, "loss": 0.3558, "step": 44675 }, { "epoch": 1.79, "learning_rate": 1.074949494949495e-06, "loss": 0.3483, "step": 44700 }, { "epoch": 1.79, "learning_rate": 1.0698989898989901e-06, "loss": 0.3358, "step": 44725 }, { "epoch": 1.79, "learning_rate": 1.064848484848485e-06, "loss": 0.3726, "step": 44750 }, { "epoch": 1.8, "learning_rate": 1.05979797979798e-06, "loss": 0.3698, "step": 44775 }, { "epoch": 1.8, "learning_rate": 1.0547474747474747e-06, "loss": 0.3674, "step": 44800 }, { "epoch": 1.8, "learning_rate": 1.0496969696969696e-06, "loss": 0.3718, "step": 44825 }, { "epoch": 1.8, "learning_rate": 1.0446464646464648e-06, "loss": 0.3684, "step": 44850 }, { "epoch": 1.8, "learning_rate": 1.0395959595959597e-06, "loss": 0.3546, "step": 44875 }, { "epoch": 1.8, "learning_rate": 1.0345454545454546e-06, "loss": 0.357, "step": 44900 }, { "epoch": 1.8, "learning_rate": 1.0294949494949496e-06, "loss": 0.3537, "step": 44925 }, { "epoch": 1.8, "learning_rate": 1.0244444444444445e-06, "loss": 0.3616, "step": 44950 }, { "epoch": 1.8, "learning_rate": 1.0193939393939394e-06, "loss": 0.349, "step": 44975 }, { "epoch": 1.8, "learning_rate": 1.0143434343434344e-06, "loss": 0.3594, "step": 45000 }, { "epoch": 1.8, "eval_loss": 0.38151976466178894, "eval_runtime": 308.7744, "eval_samples_per_second": 16.209, "eval_steps_per_second": 2.027, "eval_wer": 28.856878426161035, "step": 45000 }, { "epoch": 1.81, "learning_rate": 1.0092929292929293e-06, "loss": 0.3538, "step": 45025 }, { "epoch": 1.81, "learning_rate": 1.0042424242424244e-06, "loss": 0.3699, "step": 45050 }, { "epoch": 1.81, "learning_rate": 9.991919191919194e-07, "loss": 0.3676, "step": 45075 }, { "epoch": 1.81, "learning_rate": 9.941414141414143e-07, "loss": 0.3679, "step": 45100 }, { "epoch": 1.81, "learning_rate": 9.890909090909092e-07, "loss": 0.3621, "step": 45125 }, { "epoch": 1.81, "learning_rate": 9.840404040404042e-07, "loss": 0.3517, "step": 45150 }, { "epoch": 1.81, "learning_rate": 9.78989898989899e-07, "loss": 0.3819, "step": 45175 }, { "epoch": 1.81, "learning_rate": 9.73939393939394e-07, "loss": 0.3628, "step": 45200 }, { "epoch": 1.81, "learning_rate": 9.68888888888889e-07, "loss": 0.3475, "step": 45225 }, { "epoch": 1.81, "learning_rate": 9.638383838383839e-07, "loss": 0.3486, "step": 45250 }, { "epoch": 1.82, "learning_rate": 9.587878787878788e-07, "loss": 0.3573, "step": 45275 }, { "epoch": 1.82, "learning_rate": 9.537373737373737e-07, "loss": 0.3664, "step": 45300 }, { "epoch": 1.82, "learning_rate": 9.486868686868688e-07, "loss": 0.3648, "step": 45325 }, { "epoch": 1.82, "learning_rate": 9.436363636363636e-07, "loss": 0.3614, "step": 45350 }, { "epoch": 1.82, "learning_rate": 9.385858585858588e-07, "loss": 0.3586, "step": 45375 }, { "epoch": 1.82, "learning_rate": 9.335353535353536e-07, "loss": 0.3629, "step": 45400 }, { "epoch": 1.82, "learning_rate": 9.284848484848485e-07, "loss": 0.38, "step": 45425 }, { "epoch": 1.82, "learning_rate": 9.234343434343434e-07, "loss": 0.3636, "step": 45450 }, { "epoch": 1.82, "learning_rate": 9.183838383838385e-07, "loss": 0.3382, "step": 45475 }, { "epoch": 1.82, "learning_rate": 9.133333333333334e-07, "loss": 0.3504, "step": 45500 }, { "epoch": 1.83, "learning_rate": 9.082828282828283e-07, "loss": 0.3541, "step": 45525 }, { "epoch": 1.83, "learning_rate": 9.032323232323233e-07, "loss": 0.3672, "step": 45550 }, { "epoch": 1.83, "learning_rate": 8.981818181818183e-07, "loss": 0.3681, "step": 45575 }, { "epoch": 1.83, "learning_rate": 8.931313131313132e-07, "loss": 0.3692, "step": 45600 }, { "epoch": 1.83, "learning_rate": 8.880808080808082e-07, "loss": 0.3579, "step": 45625 }, { "epoch": 1.83, "learning_rate": 8.830303030303031e-07, "loss": 0.3597, "step": 45650 }, { "epoch": 1.83, "learning_rate": 8.77979797979798e-07, "loss": 0.3499, "step": 45675 }, { "epoch": 1.83, "learning_rate": 8.729292929292931e-07, "loss": 0.3556, "step": 45700 }, { "epoch": 1.83, "learning_rate": 8.680808080808082e-07, "loss": 0.3659, "step": 45725 }, { "epoch": 1.83, "learning_rate": 8.630303030303031e-07, "loss": 0.3677, "step": 45750 }, { "epoch": 1.84, "learning_rate": 8.579797979797981e-07, "loss": 0.352, "step": 45775 }, { "epoch": 1.84, "learning_rate": 8.529292929292931e-07, "loss": 0.3722, "step": 45800 }, { "epoch": 1.84, "learning_rate": 8.47878787878788e-07, "loss": 0.353, "step": 45825 }, { "epoch": 1.84, "learning_rate": 8.428282828282828e-07, "loss": 0.3546, "step": 45850 }, { "epoch": 1.84, "learning_rate": 8.37777777777778e-07, "loss": 0.3588, "step": 45875 }, { "epoch": 1.84, "learning_rate": 8.327272727272728e-07, "loss": 0.367, "step": 45900 }, { "epoch": 1.84, "learning_rate": 8.276767676767677e-07, "loss": 0.3414, "step": 45925 }, { "epoch": 1.84, "learning_rate": 8.226262626262626e-07, "loss": 0.3635, "step": 45950 }, { "epoch": 1.84, "learning_rate": 8.175757575757576e-07, "loss": 0.3416, "step": 45975 }, { "epoch": 1.84, "learning_rate": 8.125252525252526e-07, "loss": 0.3722, "step": 46000 }, { "epoch": 1.85, "learning_rate": 8.074747474747475e-07, "loss": 0.3616, "step": 46025 }, { "epoch": 1.85, "learning_rate": 8.024242424242425e-07, "loss": 0.3517, "step": 46050 }, { "epoch": 1.85, "learning_rate": 7.973737373737374e-07, "loss": 0.3687, "step": 46075 }, { "epoch": 1.85, "learning_rate": 7.923232323232324e-07, "loss": 0.3546, "step": 46100 }, { "epoch": 1.85, "learning_rate": 7.872727272727274e-07, "loss": 0.3582, "step": 46125 }, { "epoch": 1.85, "learning_rate": 7.822222222222223e-07, "loss": 0.357, "step": 46150 }, { "epoch": 1.85, "learning_rate": 7.771717171717172e-07, "loss": 0.3703, "step": 46175 }, { "epoch": 1.85, "learning_rate": 7.721212121212123e-07, "loss": 0.3619, "step": 46200 }, { "epoch": 1.85, "learning_rate": 7.670707070707072e-07, "loss": 0.3441, "step": 46225 }, { "epoch": 1.85, "learning_rate": 7.62020202020202e-07, "loss": 0.3565, "step": 46250 }, { "epoch": 1.86, "learning_rate": 7.56969696969697e-07, "loss": 0.3517, "step": 46275 }, { "epoch": 1.86, "learning_rate": 7.51919191919192e-07, "loss": 0.3505, "step": 46300 }, { "epoch": 1.86, "learning_rate": 7.468686868686869e-07, "loss": 0.3691, "step": 46325 }, { "epoch": 1.86, "learning_rate": 7.418181818181819e-07, "loss": 0.3626, "step": 46350 }, { "epoch": 1.86, "learning_rate": 7.367676767676768e-07, "loss": 0.3582, "step": 46375 }, { "epoch": 1.86, "learning_rate": 7.317171717171717e-07, "loss": 0.3677, "step": 46400 }, { "epoch": 1.86, "learning_rate": 7.266666666666668e-07, "loss": 0.3636, "step": 46425 }, { "epoch": 1.86, "learning_rate": 7.216161616161617e-07, "loss": 0.3677, "step": 46450 }, { "epoch": 1.86, "learning_rate": 7.165656565656566e-07, "loss": 0.3497, "step": 46475 }, { "epoch": 1.86, "learning_rate": 7.115151515151516e-07, "loss": 0.3627, "step": 46500 }, { "epoch": 1.87, "learning_rate": 7.064646464646466e-07, "loss": 0.3588, "step": 46525 }, { "epoch": 1.87, "learning_rate": 7.014141414141415e-07, "loss": 0.3537, "step": 46550 }, { "epoch": 1.87, "learning_rate": 6.963636363636364e-07, "loss": 0.357, "step": 46575 }, { "epoch": 1.87, "learning_rate": 6.913131313131313e-07, "loss": 0.3552, "step": 46600 }, { "epoch": 1.87, "learning_rate": 6.862626262626264e-07, "loss": 0.3761, "step": 46625 }, { "epoch": 1.87, "learning_rate": 6.812121212121213e-07, "loss": 0.3831, "step": 46650 }, { "epoch": 1.87, "learning_rate": 6.761616161616162e-07, "loss": 0.3443, "step": 46675 }, { "epoch": 1.87, "learning_rate": 6.711111111111111e-07, "loss": 0.3653, "step": 46700 }, { "epoch": 1.87, "learning_rate": 6.66060606060606e-07, "loss": 0.3495, "step": 46725 }, { "epoch": 1.87, "learning_rate": 6.610101010101011e-07, "loss": 0.3669, "step": 46750 }, { "epoch": 1.88, "learning_rate": 6.55959595959596e-07, "loss": 0.3691, "step": 46775 }, { "epoch": 1.88, "learning_rate": 6.50909090909091e-07, "loss": 0.3505, "step": 46800 }, { "epoch": 1.88, "learning_rate": 6.458585858585859e-07, "loss": 0.3646, "step": 46825 }, { "epoch": 1.88, "learning_rate": 6.408080808080809e-07, "loss": 0.3684, "step": 46850 }, { "epoch": 1.88, "learning_rate": 6.357575757575759e-07, "loss": 0.3579, "step": 46875 }, { "epoch": 1.88, "learning_rate": 6.307070707070708e-07, "loss": 0.3586, "step": 46900 }, { "epoch": 1.88, "learning_rate": 6.256565656565656e-07, "loss": 0.3602, "step": 46925 }, { "epoch": 1.88, "learning_rate": 6.206060606060606e-07, "loss": 0.3524, "step": 46950 }, { "epoch": 1.88, "learning_rate": 6.155555555555556e-07, "loss": 0.3422, "step": 46975 }, { "epoch": 1.88, "learning_rate": 6.105050505050505e-07, "loss": 0.3642, "step": 47000 }, { "epoch": 1.89, "learning_rate": 6.054545454545455e-07, "loss": 0.3673, "step": 47025 }, { "epoch": 1.89, "learning_rate": 6.004040404040405e-07, "loss": 0.3477, "step": 47050 }, { "epoch": 1.89, "learning_rate": 5.953535353535354e-07, "loss": 0.3442, "step": 47075 }, { "epoch": 1.89, "learning_rate": 5.903030303030303e-07, "loss": 0.3736, "step": 47100 }, { "epoch": 1.89, "learning_rate": 5.852525252525253e-07, "loss": 0.3658, "step": 47125 }, { "epoch": 1.89, "learning_rate": 5.802020202020202e-07, "loss": 0.3574, "step": 47150 }, { "epoch": 1.89, "learning_rate": 5.751515151515151e-07, "loss": 0.357, "step": 47175 }, { "epoch": 1.89, "learning_rate": 5.701010101010102e-07, "loss": 0.3691, "step": 47200 }, { "epoch": 1.89, "learning_rate": 5.650505050505051e-07, "loss": 0.3572, "step": 47225 }, { "epoch": 1.89, "learning_rate": 5.6e-07, "loss": 0.3423, "step": 47250 }, { "epoch": 1.9, "learning_rate": 5.54949494949495e-07, "loss": 0.3505, "step": 47275 }, { "epoch": 1.9, "learning_rate": 5.4989898989899e-07, "loss": 0.3661, "step": 47300 }, { "epoch": 1.9, "learning_rate": 5.448484848484848e-07, "loss": 0.3482, "step": 47325 }, { "epoch": 1.9, "learning_rate": 5.397979797979799e-07, "loss": 0.366, "step": 47350 }, { "epoch": 1.9, "learning_rate": 5.347474747474748e-07, "loss": 0.3585, "step": 47375 }, { "epoch": 1.9, "learning_rate": 5.296969696969697e-07, "loss": 0.3755, "step": 47400 }, { "epoch": 1.9, "learning_rate": 5.246464646464647e-07, "loss": 0.356, "step": 47425 }, { "epoch": 1.9, "learning_rate": 5.195959595959597e-07, "loss": 0.3426, "step": 47450 }, { "epoch": 1.9, "learning_rate": 5.145454545454546e-07, "loss": 0.3696, "step": 47475 }, { "epoch": 1.9, "learning_rate": 5.094949494949496e-07, "loss": 0.3628, "step": 47500 }, { "epoch": 1.9, "eval_loss": 0.38016417622566223, "eval_runtime": 305.1241, "eval_samples_per_second": 16.403, "eval_steps_per_second": 2.052, "eval_wer": 28.12596407128788, "step": 47500 }, { "epoch": 1.91, "learning_rate": 5.044444444444445e-07, "loss": 0.349, "step": 47525 }, { "epoch": 1.91, "learning_rate": 4.993939393939394e-07, "loss": 0.3586, "step": 47550 }, { "epoch": 1.91, "learning_rate": 4.943434343434344e-07, "loss": 0.3719, "step": 47575 }, { "epoch": 1.91, "learning_rate": 4.892929292929293e-07, "loss": 0.3709, "step": 47600 }, { "epoch": 1.91, "learning_rate": 4.842424242424243e-07, "loss": 0.3573, "step": 47625 }, { "epoch": 1.91, "learning_rate": 4.791919191919193e-07, "loss": 0.3461, "step": 47650 }, { "epoch": 1.91, "learning_rate": 4.741414141414142e-07, "loss": 0.3678, "step": 47675 }, { "epoch": 1.91, "learning_rate": 4.690909090909091e-07, "loss": 0.3563, "step": 47700 }, { "epoch": 1.91, "learning_rate": 4.640404040404041e-07, "loss": 0.3588, "step": 47725 }, { "epoch": 1.91, "learning_rate": 4.5898989898989904e-07, "loss": 0.3578, "step": 47750 }, { "epoch": 1.92, "learning_rate": 4.5414141414141417e-07, "loss": 0.3741, "step": 47775 }, { "epoch": 1.92, "learning_rate": 4.4909090909090916e-07, "loss": 0.3793, "step": 47800 }, { "epoch": 1.92, "learning_rate": 4.440404040404041e-07, "loss": 0.3776, "step": 47825 }, { "epoch": 1.92, "learning_rate": 4.38989898989899e-07, "loss": 0.3486, "step": 47850 }, { "epoch": 1.92, "learning_rate": 4.33939393939394e-07, "loss": 0.362, "step": 47875 }, { "epoch": 1.92, "learning_rate": 4.288888888888889e-07, "loss": 0.3597, "step": 47900 }, { "epoch": 1.92, "learning_rate": 4.2383838383838387e-07, "loss": 0.3692, "step": 47925 }, { "epoch": 1.92, "learning_rate": 4.187878787878788e-07, "loss": 0.3558, "step": 47950 }, { "epoch": 1.92, "learning_rate": 4.137373737373738e-07, "loss": 0.3565, "step": 47975 }, { "epoch": 1.92, "learning_rate": 4.086868686868687e-07, "loss": 0.3516, "step": 48000 }, { "epoch": 1.93, "learning_rate": 4.036363636363637e-07, "loss": 0.3644, "step": 48025 }, { "epoch": 1.93, "learning_rate": 3.985858585858586e-07, "loss": 0.3622, "step": 48050 }, { "epoch": 1.93, "learning_rate": 3.935353535353536e-07, "loss": 0.3378, "step": 48075 }, { "epoch": 1.93, "learning_rate": 3.884848484848485e-07, "loss": 0.3791, "step": 48100 }, { "epoch": 1.93, "learning_rate": 3.834343434343435e-07, "loss": 0.3635, "step": 48125 }, { "epoch": 1.93, "learning_rate": 3.783838383838384e-07, "loss": 0.3637, "step": 48150 }, { "epoch": 1.93, "learning_rate": 3.733333333333334e-07, "loss": 0.3659, "step": 48175 }, { "epoch": 1.93, "learning_rate": 3.682828282828283e-07, "loss": 0.354, "step": 48200 }, { "epoch": 1.93, "learning_rate": 3.632323232323232e-07, "loss": 0.3786, "step": 48225 }, { "epoch": 1.93, "learning_rate": 3.581818181818182e-07, "loss": 0.3566, "step": 48250 }, { "epoch": 1.94, "learning_rate": 3.531313131313131e-07, "loss": 0.3541, "step": 48275 }, { "epoch": 1.94, "learning_rate": 3.480808080808081e-07, "loss": 0.3627, "step": 48300 }, { "epoch": 1.94, "learning_rate": 3.4303030303030304e-07, "loss": 0.3565, "step": 48325 }, { "epoch": 1.94, "learning_rate": 3.37979797979798e-07, "loss": 0.3752, "step": 48350 }, { "epoch": 1.94, "learning_rate": 3.3292929292929295e-07, "loss": 0.3762, "step": 48375 }, { "epoch": 1.94, "learning_rate": 3.2787878787878794e-07, "loss": 0.3475, "step": 48400 }, { "epoch": 1.94, "learning_rate": 3.228282828282828e-07, "loss": 0.3726, "step": 48425 }, { "epoch": 1.94, "learning_rate": 3.177777777777778e-07, "loss": 0.3556, "step": 48450 }, { "epoch": 1.94, "learning_rate": 3.1272727272727273e-07, "loss": 0.4022, "step": 48475 }, { "epoch": 1.94, "learning_rate": 3.076767676767677e-07, "loss": 0.3513, "step": 48500 }, { "epoch": 1.95, "learning_rate": 3.0262626262626265e-07, "loss": 0.355, "step": 48525 }, { "epoch": 1.95, "learning_rate": 2.975757575757576e-07, "loss": 0.3733, "step": 48550 }, { "epoch": 1.95, "learning_rate": 2.9252525252525256e-07, "loss": 0.3635, "step": 48575 }, { "epoch": 1.95, "learning_rate": 2.874747474747475e-07, "loss": 0.3639, "step": 48600 }, { "epoch": 1.95, "learning_rate": 2.8242424242424243e-07, "loss": 0.3438, "step": 48625 }, { "epoch": 1.95, "learning_rate": 2.773737373737374e-07, "loss": 0.3616, "step": 48650 }, { "epoch": 1.95, "learning_rate": 2.7232323232323234e-07, "loss": 0.3639, "step": 48675 }, { "epoch": 1.95, "learning_rate": 2.6727272727272733e-07, "loss": 0.3542, "step": 48700 }, { "epoch": 1.95, "learning_rate": 2.6222222222222226e-07, "loss": 0.3455, "step": 48725 }, { "epoch": 1.95, "learning_rate": 2.571717171717172e-07, "loss": 0.3833, "step": 48750 }, { "epoch": 1.96, "learning_rate": 2.521212121212122e-07, "loss": 0.359, "step": 48775 }, { "epoch": 1.96, "learning_rate": 2.470707070707071e-07, "loss": 0.3734, "step": 48800 }, { "epoch": 1.96, "learning_rate": 2.4202020202020204e-07, "loss": 0.3745, "step": 48825 }, { "epoch": 1.96, "learning_rate": 2.3696969696969697e-07, "loss": 0.3558, "step": 48850 }, { "epoch": 1.96, "learning_rate": 2.3191919191919193e-07, "loss": 0.3513, "step": 48875 }, { "epoch": 1.96, "learning_rate": 2.2686868686868689e-07, "loss": 0.3703, "step": 48900 }, { "epoch": 1.96, "learning_rate": 2.2181818181818182e-07, "loss": 0.3623, "step": 48925 }, { "epoch": 1.96, "learning_rate": 2.1676767676767677e-07, "loss": 0.3853, "step": 48950 }, { "epoch": 1.96, "learning_rate": 2.1171717171717173e-07, "loss": 0.3714, "step": 48975 }, { "epoch": 1.96, "learning_rate": 2.066666666666667e-07, "loss": 0.3584, "step": 49000 }, { "epoch": 1.97, "learning_rate": 2.0161616161616162e-07, "loss": 0.3547, "step": 49025 }, { "epoch": 1.97, "learning_rate": 1.9656565656565658e-07, "loss": 0.3564, "step": 49050 }, { "epoch": 1.97, "learning_rate": 1.9151515151515154e-07, "loss": 0.3501, "step": 49075 }, { "epoch": 1.97, "learning_rate": 1.864646464646465e-07, "loss": 0.3717, "step": 49100 }, { "epoch": 1.97, "learning_rate": 1.8141414141414143e-07, "loss": 0.3698, "step": 49125 }, { "epoch": 1.97, "learning_rate": 1.7636363636363639e-07, "loss": 0.3603, "step": 49150 }, { "epoch": 1.97, "learning_rate": 1.7131313131313134e-07, "loss": 0.37, "step": 49175 }, { "epoch": 1.97, "learning_rate": 1.662626262626263e-07, "loss": 0.3386, "step": 49200 }, { "epoch": 1.97, "learning_rate": 1.612121212121212e-07, "loss": 0.3509, "step": 49225 }, { "epoch": 1.97, "learning_rate": 1.5616161616161617e-07, "loss": 0.3479, "step": 49250 }, { "epoch": 1.98, "learning_rate": 1.5111111111111112e-07, "loss": 0.3466, "step": 49275 }, { "epoch": 1.98, "learning_rate": 1.4606060606060608e-07, "loss": 0.3577, "step": 49300 }, { "epoch": 1.98, "learning_rate": 1.41010101010101e-07, "loss": 0.366, "step": 49325 }, { "epoch": 1.98, "learning_rate": 1.3595959595959597e-07, "loss": 0.387, "step": 49350 }, { "epoch": 1.98, "learning_rate": 1.3090909090909093e-07, "loss": 0.3762, "step": 49375 }, { "epoch": 1.98, "learning_rate": 1.2585858585858586e-07, "loss": 0.3528, "step": 49400 }, { "epoch": 1.98, "learning_rate": 1.2080808080808082e-07, "loss": 0.372, "step": 49425 }, { "epoch": 1.98, "learning_rate": 1.1575757575757578e-07, "loss": 0.3442, "step": 49450 }, { "epoch": 1.98, "learning_rate": 1.1070707070707072e-07, "loss": 0.3603, "step": 49475 }, { "epoch": 1.98, "learning_rate": 1.0565656565656568e-07, "loss": 0.3604, "step": 49500 }, { "epoch": 1.99, "learning_rate": 1.0060606060606061e-07, "loss": 0.3561, "step": 49525 }, { "epoch": 1.99, "learning_rate": 9.555555555555556e-08, "loss": 0.3634, "step": 49550 }, { "epoch": 1.99, "learning_rate": 9.050505050505051e-08, "loss": 0.361, "step": 49575 }, { "epoch": 1.99, "learning_rate": 8.545454545454546e-08, "loss": 0.3529, "step": 49600 }, { "epoch": 1.99, "learning_rate": 8.040404040404042e-08, "loss": 0.358, "step": 49625 }, { "epoch": 1.99, "learning_rate": 7.535353535353536e-08, "loss": 0.352, "step": 49650 }, { "epoch": 1.99, "learning_rate": 7.03030303030303e-08, "loss": 0.3733, "step": 49675 }, { "epoch": 1.99, "learning_rate": 6.525252525252525e-08, "loss": 0.3568, "step": 49700 }, { "epoch": 1.99, "learning_rate": 6.020202020202021e-08, "loss": 0.3649, "step": 49725 }, { "epoch": 1.99, "learning_rate": 5.515151515151516e-08, "loss": 0.3645, "step": 49750 }, { "epoch": 2.0, "learning_rate": 5.0101010101010105e-08, "loss": 0.3589, "step": 49775 }, { "epoch": 2.0, "learning_rate": 4.5252525252525257e-08, "loss": 0.3687, "step": 49800 }, { "epoch": 2.0, "learning_rate": 4.020202020202021e-08, "loss": 0.3764, "step": 49825 }, { "epoch": 2.0, "learning_rate": 3.515151515151515e-08, "loss": 0.3622, "step": 49850 }, { "epoch": 2.0, "learning_rate": 3.0101010101010104e-08, "loss": 0.349, "step": 49875 }, { "epoch": 2.0, "learning_rate": 2.5050505050505052e-08, "loss": 0.3612, "step": 49900 }, { "epoch": 2.0, "learning_rate": 2e-08, "loss": 0.358, "step": 49925 }, { "epoch": 2.0, "learning_rate": 1.4949494949494952e-08, "loss": 0.3431, "step": 49950 }, { "epoch": 2.0, "learning_rate": 9.8989898989899e-09, "loss": 0.353, "step": 49975 }, { "epoch": 2.0, "learning_rate": 4.848484848484849e-09, "loss": 0.3392, "step": 50000 }, { "epoch": 2.0, "eval_loss": 0.37952831387519836, "eval_runtime": 312.4104, "eval_samples_per_second": 16.021, "eval_steps_per_second": 2.004, "eval_wer": 28.726358005647974, "step": 50000 }, { "epoch": 2.0, "step": 50000, "total_flos": 9.7854051981312e+19, "train_loss": 0.47914609115600587, "train_runtime": 101277.4875, "train_samples_per_second": 31.596, "train_steps_per_second": 0.494 } ], "logging_steps": 25, "max_steps": 50000, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 2500, "total_flos": 9.7854051981312e+19, "train_batch_size": 64, "trial_name": null, "trial_params": null }