diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,62406 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 4.999674054758801, + "eval_steps": 500, + "global_step": 51130, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 1e-08, + "loss": 0.3429, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 2e-08, + "loss": 0.2779, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 2.8e-08, + "loss": 0.3114, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 3.7999999999999996e-08, + "loss": 0.3972, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 4.8000000000000006e-08, + "loss": 0.3104, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 5.6e-08, + "loss": 0.3122, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 6.600000000000001e-08, + "loss": 0.4011, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 7.599999999999999e-08, + "loss": 0.3115, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 8.6e-08, + "loss": 0.334, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 9.600000000000001e-08, + "loss": 0.315, + "step": 50 + }, + { + "epoch": 0.01, + "learning_rate": 1.06e-07, + "loss": 0.3668, + "step": 55 + }, + { + "epoch": 0.01, + "learning_rate": 1.16e-07, + "loss": 0.2968, + "step": 60 + }, + { + "epoch": 0.01, + "learning_rate": 1.26e-07, + "loss": 0.3175, + "step": 65 + }, + { + "epoch": 0.01, + "learning_rate": 1.36e-07, + "loss": 0.3536, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 1.46e-07, + "loss": 0.3557, + "step": 75 + }, + { + "epoch": 0.01, + "learning_rate": 1.56e-07, + "loss": 0.2975, + "step": 80 + }, + { + "epoch": 0.01, + "learning_rate": 1.66e-07, + "loss": 0.3909, + "step": 85 + }, + { + "epoch": 0.01, + "learning_rate": 1.7600000000000001e-07, + "loss": 0.3198, + "step": 90 + }, + { + "epoch": 0.01, + "learning_rate": 1.86e-07, + "loss": 0.2794, + "step": 95 + }, + { + "epoch": 0.01, + "learning_rate": 1.96e-07, + "loss": 0.368, + "step": 100 + }, + { + "epoch": 0.01, + "learning_rate": 2.04e-07, + "loss": 0.3359, + "step": 105 + }, + { + "epoch": 0.01, + "learning_rate": 2.14e-07, + "loss": 0.3208, + "step": 110 + }, + { + "epoch": 0.01, + "learning_rate": 2.24e-07, + "loss": 0.3115, + "step": 115 + }, + { + "epoch": 0.01, + "learning_rate": 2.34e-07, + "loss": 0.344, + "step": 120 + }, + { + "epoch": 0.01, + "learning_rate": 2.4399999999999996e-07, + "loss": 0.2995, + "step": 125 + }, + { + "epoch": 0.01, + "learning_rate": 2.54e-07, + "loss": 0.3125, + "step": 130 + }, + { + "epoch": 0.01, + "learning_rate": 2.6400000000000003e-07, + "loss": 0.3671, + "step": 135 + }, + { + "epoch": 0.01, + "learning_rate": 2.74e-07, + "loss": 0.3014, + "step": 140 + }, + { + "epoch": 0.01, + "learning_rate": 2.84e-07, + "loss": 0.2985, + "step": 145 + }, + { + "epoch": 0.01, + "learning_rate": 2.94e-07, + "loss": 0.3192, + "step": 150 + }, + { + "epoch": 0.02, + "learning_rate": 3.0399999999999997e-07, + "loss": 0.3205, + "step": 155 + }, + { + "epoch": 0.02, + "learning_rate": 3.1400000000000003e-07, + "loss": 0.2878, + "step": 160 + }, + { + "epoch": 0.02, + "learning_rate": 3.2400000000000004e-07, + "loss": 0.2965, + "step": 165 + }, + { + "epoch": 0.02, + "learning_rate": 3.34e-07, + "loss": 0.3394, + "step": 170 + }, + { + "epoch": 0.02, + "learning_rate": 3.44e-07, + "loss": 0.2886, + "step": 175 + }, + { + "epoch": 0.02, + "learning_rate": 3.54e-07, + "loss": 0.287, + "step": 180 + }, + { + "epoch": 0.02, + "learning_rate": 3.64e-07, + "loss": 0.339, + "step": 185 + }, + { + "epoch": 0.02, + "learning_rate": 3.74e-07, + "loss": 0.3049, + "step": 190 + }, + { + "epoch": 0.02, + "learning_rate": 3.8400000000000005e-07, + "loss": 0.2967, + "step": 195 + }, + { + "epoch": 0.02, + "learning_rate": 3.94e-07, + "loss": 0.3458, + "step": 200 + }, + { + "epoch": 0.02, + "learning_rate": 4.04e-07, + "loss": 0.3283, + "step": 205 + }, + { + "epoch": 0.02, + "learning_rate": 4.1400000000000003e-07, + "loss": 0.3008, + "step": 210 + }, + { + "epoch": 0.02, + "learning_rate": 4.24e-07, + "loss": 0.2842, + "step": 215 + }, + { + "epoch": 0.02, + "learning_rate": 4.34e-07, + "loss": 0.3454, + "step": 220 + }, + { + "epoch": 0.02, + "learning_rate": 4.44e-07, + "loss": 0.2683, + "step": 225 + }, + { + "epoch": 0.02, + "learning_rate": 4.54e-07, + "loss": 0.2992, + "step": 230 + }, + { + "epoch": 0.02, + "learning_rate": 4.64e-07, + "loss": 0.3969, + "step": 235 + }, + { + "epoch": 0.02, + "learning_rate": 4.7400000000000004e-07, + "loss": 0.308, + "step": 240 + }, + { + "epoch": 0.02, + "learning_rate": 4.84e-07, + "loss": 0.2762, + "step": 245 + }, + { + "epoch": 0.02, + "learning_rate": 4.940000000000001e-07, + "loss": 0.3186, + "step": 250 + }, + { + "epoch": 0.02, + "learning_rate": 5.04e-07, + "loss": 0.3062, + "step": 255 + }, + { + "epoch": 0.03, + "learning_rate": 5.140000000000001e-07, + "loss": 0.2716, + "step": 260 + }, + { + "epoch": 0.03, + "learning_rate": 5.24e-07, + "loss": 0.3, + "step": 265 + }, + { + "epoch": 0.03, + "learning_rate": 5.34e-07, + "loss": 0.3274, + "step": 270 + }, + { + "epoch": 0.03, + "learning_rate": 5.44e-07, + "loss": 0.2817, + "step": 275 + }, + { + "epoch": 0.03, + "learning_rate": 5.54e-07, + "loss": 0.2971, + "step": 280 + }, + { + "epoch": 0.03, + "learning_rate": 5.64e-07, + "loss": 0.3433, + "step": 285 + }, + { + "epoch": 0.03, + "learning_rate": 5.739999999999999e-07, + "loss": 0.2809, + "step": 290 + }, + { + "epoch": 0.03, + "learning_rate": 5.84e-07, + "loss": 0.2901, + "step": 295 + }, + { + "epoch": 0.03, + "learning_rate": 5.94e-07, + "loss": 0.2956, + "step": 300 + }, + { + "epoch": 0.03, + "learning_rate": 6.04e-07, + "loss": 0.3311, + "step": 305 + }, + { + "epoch": 0.03, + "learning_rate": 6.140000000000001e-07, + "loss": 0.2591, + "step": 310 + }, + { + "epoch": 0.03, + "learning_rate": 6.24e-07, + "loss": 0.3027, + "step": 315 + }, + { + "epoch": 0.03, + "learning_rate": 6.34e-07, + "loss": 0.3646, + "step": 320 + }, + { + "epoch": 0.03, + "learning_rate": 6.44e-07, + "loss": 0.2757, + "step": 325 + }, + { + "epoch": 0.03, + "learning_rate": 6.54e-07, + "loss": 0.2801, + "step": 330 + }, + { + "epoch": 0.03, + "learning_rate": 6.64e-07, + "loss": 0.3119, + "step": 335 + }, + { + "epoch": 0.03, + "learning_rate": 6.74e-07, + "loss": 0.2802, + "step": 340 + }, + { + "epoch": 0.03, + "learning_rate": 6.84e-07, + "loss": 0.2601, + "step": 345 + }, + { + "epoch": 0.03, + "learning_rate": 6.939999999999999e-07, + "loss": 0.3172, + "step": 350 + }, + { + "epoch": 0.03, + "learning_rate": 7.040000000000001e-07, + "loss": 0.304, + "step": 355 + }, + { + "epoch": 0.04, + "learning_rate": 7.140000000000001e-07, + "loss": 0.2665, + "step": 360 + }, + { + "epoch": 0.04, + "learning_rate": 7.24e-07, + "loss": 0.2602, + "step": 365 + }, + { + "epoch": 0.04, + "learning_rate": 7.340000000000001e-07, + "loss": 0.3047, + "step": 370 + }, + { + "epoch": 0.04, + "learning_rate": 7.44e-07, + "loss": 0.2546, + "step": 375 + }, + { + "epoch": 0.04, + "learning_rate": 7.54e-07, + "loss": 0.289, + "step": 380 + }, + { + "epoch": 0.04, + "learning_rate": 7.64e-07, + "loss": 0.3357, + "step": 385 + }, + { + "epoch": 0.04, + "learning_rate": 7.74e-07, + "loss": 0.2802, + "step": 390 + }, + { + "epoch": 0.04, + "learning_rate": 7.84e-07, + "loss": 0.251, + "step": 395 + }, + { + "epoch": 0.04, + "learning_rate": 7.94e-07, + "loss": 0.3031, + "step": 400 + }, + { + "epoch": 0.04, + "learning_rate": 8.04e-07, + "loss": 0.3216, + "step": 405 + }, + { + "epoch": 0.04, + "learning_rate": 8.14e-07, + "loss": 0.2704, + "step": 410 + }, + { + "epoch": 0.04, + "learning_rate": 8.240000000000001e-07, + "loss": 0.2726, + "step": 415 + }, + { + "epoch": 0.04, + "learning_rate": 8.34e-07, + "loss": 0.3193, + "step": 420 + }, + { + "epoch": 0.04, + "learning_rate": 8.44e-07, + "loss": 0.2705, + "step": 425 + }, + { + "epoch": 0.04, + "learning_rate": 8.540000000000001e-07, + "loss": 0.2798, + "step": 430 + }, + { + "epoch": 0.04, + "learning_rate": 8.64e-07, + "loss": 0.3584, + "step": 435 + }, + { + "epoch": 0.04, + "learning_rate": 8.74e-07, + "loss": 0.2747, + "step": 440 + }, + { + "epoch": 0.04, + "learning_rate": 8.84e-07, + "loss": 0.2658, + "step": 445 + }, + { + "epoch": 0.04, + "learning_rate": 8.94e-07, + "loss": 0.2969, + "step": 450 + }, + { + "epoch": 0.04, + "learning_rate": 9.04e-07, + "loss": 0.312, + "step": 455 + }, + { + "epoch": 0.04, + "learning_rate": 9.140000000000001e-07, + "loss": 0.2484, + "step": 460 + }, + { + "epoch": 0.05, + "learning_rate": 9.240000000000001e-07, + "loss": 0.2783, + "step": 465 + }, + { + "epoch": 0.05, + "learning_rate": 9.34e-07, + "loss": 0.3061, + "step": 470 + }, + { + "epoch": 0.05, + "learning_rate": 9.44e-07, + "loss": 0.268, + "step": 475 + }, + { + "epoch": 0.05, + "learning_rate": 9.54e-07, + "loss": 0.2689, + "step": 480 + }, + { + "epoch": 0.05, + "learning_rate": 9.64e-07, + "loss": 0.3157, + "step": 485 + }, + { + "epoch": 0.05, + "learning_rate": 9.74e-07, + "loss": 0.2956, + "step": 490 + }, + { + "epoch": 0.05, + "learning_rate": 9.84e-07, + "loss": 0.2529, + "step": 495 + }, + { + "epoch": 0.05, + "learning_rate": 9.940000000000001e-07, + "loss": 0.3302, + "step": 500 + }, + { + "epoch": 0.05, + "eval_cer": 0.08888457260718059, + "eval_loss": 0.4542786180973053, + "eval_runtime": 269.2827, + "eval_samples_per_second": 60.791, + "eval_steps_per_second": 1.69, + "eval_wer": 0.23331134952299484, + "step": 500 + }, + { + "epoch": 0.05, + "learning_rate": 1.004e-06, + "loss": 0.3182, + "step": 505 + }, + { + "epoch": 0.05, + "learning_rate": 1.014e-06, + "loss": 0.2778, + "step": 510 + }, + { + "epoch": 0.05, + "learning_rate": 1.024e-06, + "loss": 0.2839, + "step": 515 + }, + { + "epoch": 0.05, + "learning_rate": 1.034e-06, + "loss": 0.3156, + "step": 520 + }, + { + "epoch": 0.05, + "learning_rate": 1.0439999999999999e-06, + "loss": 0.2663, + "step": 525 + }, + { + "epoch": 0.05, + "learning_rate": 1.0540000000000002e-06, + "loss": 0.2894, + "step": 530 + }, + { + "epoch": 0.05, + "learning_rate": 1.064e-06, + "loss": 0.2933, + "step": 535 + }, + { + "epoch": 0.05, + "learning_rate": 1.074e-06, + "loss": 0.2736, + "step": 540 + }, + { + "epoch": 0.05, + "learning_rate": 1.0840000000000001e-06, + "loss": 0.2637, + "step": 545 + }, + { + "epoch": 0.05, + "learning_rate": 1.094e-06, + "loss": 0.2773, + "step": 550 + }, + { + "epoch": 0.05, + "learning_rate": 1.104e-06, + "loss": 0.2872, + "step": 555 + }, + { + "epoch": 0.05, + "learning_rate": 1.114e-06, + "loss": 0.2758, + "step": 560 + }, + { + "epoch": 0.06, + "learning_rate": 1.1240000000000002e-06, + "loss": 0.2824, + "step": 565 + }, + { + "epoch": 0.06, + "learning_rate": 1.134e-06, + "loss": 0.3348, + "step": 570 + }, + { + "epoch": 0.06, + "learning_rate": 1.144e-06, + "loss": 0.2412, + "step": 575 + }, + { + "epoch": 0.06, + "learning_rate": 1.154e-06, + "loss": 0.2371, + "step": 580 + }, + { + "epoch": 0.06, + "learning_rate": 1.164e-06, + "loss": 0.2971, + "step": 585 + }, + { + "epoch": 0.06, + "learning_rate": 1.174e-06, + "loss": 0.3093, + "step": 590 + }, + { + "epoch": 0.06, + "learning_rate": 1.184e-06, + "loss": 0.2638, + "step": 595 + }, + { + "epoch": 0.06, + "learning_rate": 1.1940000000000001e-06, + "loss": 0.2982, + "step": 600 + }, + { + "epoch": 0.06, + "learning_rate": 1.204e-06, + "loss": 0.2878, + "step": 605 + }, + { + "epoch": 0.06, + "learning_rate": 1.214e-06, + "loss": 0.2495, + "step": 610 + }, + { + "epoch": 0.06, + "learning_rate": 1.224e-06, + "loss": 0.2891, + "step": 615 + }, + { + "epoch": 0.06, + "learning_rate": 1.234e-06, + "loss": 0.3404, + "step": 620 + }, + { + "epoch": 0.06, + "learning_rate": 1.244e-06, + "loss": 0.2466, + "step": 625 + }, + { + "epoch": 0.06, + "learning_rate": 1.254e-06, + "loss": 0.2597, + "step": 630 + }, + { + "epoch": 0.06, + "learning_rate": 1.264e-06, + "loss": 0.3075, + "step": 635 + }, + { + "epoch": 0.06, + "learning_rate": 1.274e-06, + "loss": 0.2875, + "step": 640 + }, + { + "epoch": 0.06, + "learning_rate": 1.284e-06, + "loss": 0.2437, + "step": 645 + }, + { + "epoch": 0.06, + "learning_rate": 1.294e-06, + "loss": 0.2762, + "step": 650 + }, + { + "epoch": 0.06, + "learning_rate": 1.3040000000000001e-06, + "loss": 0.2707, + "step": 655 + }, + { + "epoch": 0.06, + "learning_rate": 1.314e-06, + "loss": 0.2579, + "step": 660 + }, + { + "epoch": 0.07, + "learning_rate": 1.324e-06, + "loss": 0.2885, + "step": 665 + }, + { + "epoch": 0.07, + "learning_rate": 1.334e-06, + "loss": 0.313, + "step": 670 + }, + { + "epoch": 0.07, + "learning_rate": 1.344e-06, + "loss": 0.2835, + "step": 675 + }, + { + "epoch": 0.07, + "learning_rate": 1.3539999999999999e-06, + "loss": 0.2703, + "step": 680 + }, + { + "epoch": 0.07, + "learning_rate": 1.3640000000000002e-06, + "loss": 0.2845, + "step": 685 + }, + { + "epoch": 0.07, + "learning_rate": 1.374e-06, + "loss": 0.277, + "step": 690 + }, + { + "epoch": 0.07, + "learning_rate": 1.384e-06, + "loss": 0.2309, + "step": 695 + }, + { + "epoch": 0.07, + "learning_rate": 1.3940000000000001e-06, + "loss": 0.2987, + "step": 700 + }, + { + "epoch": 0.07, + "learning_rate": 1.404e-06, + "loss": 0.2716, + "step": 705 + }, + { + "epoch": 0.07, + "learning_rate": 1.414e-06, + "loss": 0.2687, + "step": 710 + }, + { + "epoch": 0.07, + "learning_rate": 1.424e-06, + "loss": 0.243, + "step": 715 + }, + { + "epoch": 0.07, + "learning_rate": 1.4340000000000002e-06, + "loss": 0.3162, + "step": 720 + }, + { + "epoch": 0.07, + "learning_rate": 1.444e-06, + "loss": 0.3106, + "step": 725 + }, + { + "epoch": 0.07, + "learning_rate": 1.454e-06, + "loss": 0.2836, + "step": 730 + }, + { + "epoch": 0.07, + "learning_rate": 1.464e-06, + "loss": 0.2641, + "step": 735 + }, + { + "epoch": 0.07, + "learning_rate": 1.474e-06, + "loss": 0.2668, + "step": 740 + }, + { + "epoch": 0.07, + "learning_rate": 1.4840000000000001e-06, + "loss": 0.2769, + "step": 745 + }, + { + "epoch": 0.07, + "learning_rate": 1.494e-06, + "loss": 0.2906, + "step": 750 + }, + { + "epoch": 0.07, + "learning_rate": 1.5040000000000001e-06, + "loss": 0.306, + "step": 755 + }, + { + "epoch": 0.07, + "learning_rate": 1.514e-06, + "loss": 0.2567, + "step": 760 + }, + { + "epoch": 0.07, + "learning_rate": 1.524e-06, + "loss": 0.2858, + "step": 765 + }, + { + "epoch": 0.08, + "learning_rate": 1.534e-06, + "loss": 0.3447, + "step": 770 + }, + { + "epoch": 0.08, + "learning_rate": 1.5440000000000002e-06, + "loss": 0.2281, + "step": 775 + }, + { + "epoch": 0.08, + "learning_rate": 1.554e-06, + "loss": 0.2636, + "step": 780 + }, + { + "epoch": 0.08, + "learning_rate": 1.564e-06, + "loss": 0.2851, + "step": 785 + }, + { + "epoch": 0.08, + "learning_rate": 1.574e-06, + "loss": 0.2653, + "step": 790 + }, + { + "epoch": 0.08, + "learning_rate": 1.584e-06, + "loss": 0.2519, + "step": 795 + }, + { + "epoch": 0.08, + "learning_rate": 1.594e-06, + "loss": 0.2857, + "step": 800 + }, + { + "epoch": 0.08, + "learning_rate": 1.604e-06, + "loss": 0.2833, + "step": 805 + }, + { + "epoch": 0.08, + "learning_rate": 1.6140000000000001e-06, + "loss": 0.2472, + "step": 810 + }, + { + "epoch": 0.08, + "learning_rate": 1.624e-06, + "loss": 0.2815, + "step": 815 + }, + { + "epoch": 0.08, + "learning_rate": 1.634e-06, + "loss": 0.3402, + "step": 820 + }, + { + "epoch": 0.08, + "learning_rate": 1.644e-06, + "loss": 0.2439, + "step": 825 + }, + { + "epoch": 0.08, + "learning_rate": 1.654e-06, + "loss": 0.2629, + "step": 830 + }, + { + "epoch": 0.08, + "learning_rate": 1.6639999999999999e-06, + "loss": 0.3033, + "step": 835 + }, + { + "epoch": 0.08, + "learning_rate": 1.6740000000000002e-06, + "loss": 0.2698, + "step": 840 + }, + { + "epoch": 0.08, + "learning_rate": 1.684e-06, + "loss": 0.2507, + "step": 845 + }, + { + "epoch": 0.08, + "learning_rate": 1.694e-06, + "loss": 0.2879, + "step": 850 + }, + { + "epoch": 0.08, + "learning_rate": 1.7040000000000001e-06, + "loss": 0.2841, + "step": 855 + }, + { + "epoch": 0.08, + "learning_rate": 1.714e-06, + "loss": 0.2503, + "step": 860 + }, + { + "epoch": 0.08, + "learning_rate": 1.724e-06, + "loss": 0.2776, + "step": 865 + }, + { + "epoch": 0.09, + "learning_rate": 1.734e-06, + "loss": 0.2849, + "step": 870 + }, + { + "epoch": 0.09, + "learning_rate": 1.7440000000000002e-06, + "loss": 0.2665, + "step": 875 + }, + { + "epoch": 0.09, + "learning_rate": 1.754e-06, + "loss": 0.2663, + "step": 880 + }, + { + "epoch": 0.09, + "learning_rate": 1.764e-06, + "loss": 0.2954, + "step": 885 + }, + { + "epoch": 0.09, + "learning_rate": 1.774e-06, + "loss": 0.2697, + "step": 890 + }, + { + "epoch": 0.09, + "learning_rate": 1.784e-06, + "loss": 0.2573, + "step": 895 + }, + { + "epoch": 0.09, + "learning_rate": 1.794e-06, + "loss": 0.2872, + "step": 900 + }, + { + "epoch": 0.09, + "learning_rate": 1.804e-06, + "loss": 0.2793, + "step": 905 + }, + { + "epoch": 0.09, + "learning_rate": 1.8140000000000001e-06, + "loss": 0.2318, + "step": 910 + }, + { + "epoch": 0.09, + "learning_rate": 1.824e-06, + "loss": 0.259, + "step": 915 + }, + { + "epoch": 0.09, + "learning_rate": 1.834e-06, + "loss": 0.2816, + "step": 920 + }, + { + "epoch": 0.09, + "learning_rate": 1.844e-06, + "loss": 0.2662, + "step": 925 + }, + { + "epoch": 0.09, + "learning_rate": 1.8540000000000002e-06, + "loss": 0.2481, + "step": 930 + }, + { + "epoch": 0.09, + "learning_rate": 1.864e-06, + "loss": 0.287, + "step": 935 + }, + { + "epoch": 0.09, + "learning_rate": 1.874e-06, + "loss": 0.2475, + "step": 940 + }, + { + "epoch": 0.09, + "learning_rate": 1.8839999999999999e-06, + "loss": 0.2331, + "step": 945 + }, + { + "epoch": 0.09, + "learning_rate": 1.894e-06, + "loss": 0.293, + "step": 950 + }, + { + "epoch": 0.09, + "learning_rate": 1.9040000000000001e-06, + "loss": 0.2846, + "step": 955 + }, + { + "epoch": 0.09, + "learning_rate": 1.914e-06, + "loss": 0.2318, + "step": 960 + }, + { + "epoch": 0.09, + "learning_rate": 1.924e-06, + "loss": 0.2424, + "step": 965 + }, + { + "epoch": 0.09, + "learning_rate": 1.934e-06, + "loss": 0.3075, + "step": 970 + }, + { + "epoch": 0.1, + "learning_rate": 1.944e-06, + "loss": 0.2622, + "step": 975 + }, + { + "epoch": 0.1, + "learning_rate": 1.9540000000000003e-06, + "loss": 0.2683, + "step": 980 + }, + { + "epoch": 0.1, + "learning_rate": 1.964e-06, + "loss": 0.26, + "step": 985 + }, + { + "epoch": 0.1, + "learning_rate": 1.974e-06, + "loss": 0.2478, + "step": 990 + }, + { + "epoch": 0.1, + "learning_rate": 1.984e-06, + "loss": 0.2337, + "step": 995 + }, + { + "epoch": 0.1, + "learning_rate": 1.994e-06, + "loss": 0.2579, + "step": 1000 + }, + { + "epoch": 0.1, + "eval_cer": 0.08320211066175535, + "eval_loss": 0.41720014810562134, + "eval_runtime": 329.6449, + "eval_samples_per_second": 49.659, + "eval_steps_per_second": 1.38, + "eval_wer": 0.22127031597918287, + "step": 1000 + }, + { + "epoch": 0.1, + "learning_rate": 2.004e-06, + "loss": 0.2718, + "step": 1005 + }, + { + "epoch": 0.1, + "learning_rate": 2.014e-06, + "loss": 0.2508, + "step": 1010 + }, + { + "epoch": 0.1, + "learning_rate": 2.024e-06, + "loss": 0.2363, + "step": 1015 + }, + { + "epoch": 0.1, + "learning_rate": 2.034e-06, + "loss": 0.3118, + "step": 1020 + }, + { + "epoch": 0.1, + "learning_rate": 2.0440000000000003e-06, + "loss": 0.2413, + "step": 1025 + }, + { + "epoch": 0.1, + "learning_rate": 2.0539999999999997e-06, + "loss": 0.2375, + "step": 1030 + }, + { + "epoch": 0.1, + "learning_rate": 2.064e-06, + "loss": 0.3097, + "step": 1035 + }, + { + "epoch": 0.1, + "learning_rate": 2.0740000000000004e-06, + "loss": 0.2556, + "step": 1040 + }, + { + "epoch": 0.1, + "learning_rate": 2.084e-06, + "loss": 0.2252, + "step": 1045 + }, + { + "epoch": 0.1, + "learning_rate": 2.094e-06, + "loss": 0.3137, + "step": 1050 + }, + { + "epoch": 0.1, + "learning_rate": 2.104e-06, + "loss": 0.2815, + "step": 1055 + }, + { + "epoch": 0.1, + "learning_rate": 2.114e-06, + "loss": 0.2271, + "step": 1060 + }, + { + "epoch": 0.1, + "learning_rate": 2.124e-06, + "loss": 0.2375, + "step": 1065 + }, + { + "epoch": 0.1, + "learning_rate": 2.1340000000000002e-06, + "loss": 0.2858, + "step": 1070 + }, + { + "epoch": 0.11, + "learning_rate": 2.144e-06, + "loss": 0.2339, + "step": 1075 + }, + { + "epoch": 0.11, + "learning_rate": 2.154e-06, + "loss": 0.2573, + "step": 1080 + }, + { + "epoch": 0.11, + "learning_rate": 2.164e-06, + "loss": 0.3153, + "step": 1085 + }, + { + "epoch": 0.11, + "learning_rate": 2.174e-06, + "loss": 0.2406, + "step": 1090 + }, + { + "epoch": 0.11, + "learning_rate": 2.184e-06, + "loss": 0.2325, + "step": 1095 + }, + { + "epoch": 0.11, + "learning_rate": 2.194e-06, + "loss": 0.269, + "step": 1100 + }, + { + "epoch": 0.11, + "learning_rate": 2.204e-06, + "loss": 0.2462, + "step": 1105 + }, + { + "epoch": 0.11, + "learning_rate": 2.2140000000000003e-06, + "loss": 0.2386, + "step": 1110 + }, + { + "epoch": 0.11, + "learning_rate": 2.224e-06, + "loss": 0.282, + "step": 1115 + }, + { + "epoch": 0.11, + "learning_rate": 2.234e-06, + "loss": 0.255, + "step": 1120 + }, + { + "epoch": 0.11, + "learning_rate": 2.244e-06, + "loss": 0.2556, + "step": 1125 + }, + { + "epoch": 0.11, + "learning_rate": 2.254e-06, + "loss": 0.2423, + "step": 1130 + }, + { + "epoch": 0.11, + "learning_rate": 2.2640000000000003e-06, + "loss": 0.3072, + "step": 1135 + }, + { + "epoch": 0.11, + "learning_rate": 2.274e-06, + "loss": 0.2656, + "step": 1140 + }, + { + "epoch": 0.11, + "learning_rate": 2.284e-06, + "loss": 0.2564, + "step": 1145 + }, + { + "epoch": 0.11, + "learning_rate": 2.294e-06, + "loss": 0.294, + "step": 1150 + }, + { + "epoch": 0.11, + "learning_rate": 2.304e-06, + "loss": 0.2584, + "step": 1155 + }, + { + "epoch": 0.11, + "learning_rate": 2.314e-06, + "loss": 0.2533, + "step": 1160 + }, + { + "epoch": 0.11, + "learning_rate": 2.324e-06, + "loss": 0.2303, + "step": 1165 + }, + { + "epoch": 0.11, + "learning_rate": 2.334e-06, + "loss": 0.2649, + "step": 1170 + }, + { + "epoch": 0.11, + "learning_rate": 2.344e-06, + "loss": 0.2415, + "step": 1175 + }, + { + "epoch": 0.12, + "learning_rate": 2.3540000000000002e-06, + "loss": 0.2423, + "step": 1180 + }, + { + "epoch": 0.12, + "learning_rate": 2.3639999999999997e-06, + "loss": 0.2733, + "step": 1185 + }, + { + "epoch": 0.12, + "learning_rate": 2.374e-06, + "loss": 0.2355, + "step": 1190 + }, + { + "epoch": 0.12, + "learning_rate": 2.3840000000000004e-06, + "loss": 0.2388, + "step": 1195 + }, + { + "epoch": 0.12, + "learning_rate": 2.394e-06, + "loss": 0.2832, + "step": 1200 + }, + { + "epoch": 0.12, + "learning_rate": 2.404e-06, + "loss": 0.2683, + "step": 1205 + }, + { + "epoch": 0.12, + "learning_rate": 2.414e-06, + "loss": 0.2401, + "step": 1210 + }, + { + "epoch": 0.12, + "learning_rate": 2.424e-06, + "loss": 0.2454, + "step": 1215 + }, + { + "epoch": 0.12, + "learning_rate": 2.434e-06, + "loss": 0.2777, + "step": 1220 + }, + { + "epoch": 0.12, + "learning_rate": 2.4440000000000002e-06, + "loss": 0.2571, + "step": 1225 + }, + { + "epoch": 0.12, + "learning_rate": 2.454e-06, + "loss": 0.2464, + "step": 1230 + }, + { + "epoch": 0.12, + "learning_rate": 2.464e-06, + "loss": 0.2735, + "step": 1235 + }, + { + "epoch": 0.12, + "learning_rate": 2.474e-06, + "loss": 0.246, + "step": 1240 + }, + { + "epoch": 0.12, + "learning_rate": 2.484e-06, + "loss": 0.2552, + "step": 1245 + }, + { + "epoch": 0.12, + "learning_rate": 2.494e-06, + "loss": 0.2693, + "step": 1250 + }, + { + "epoch": 0.12, + "learning_rate": 2.504e-06, + "loss": 0.2534, + "step": 1255 + }, + { + "epoch": 0.12, + "learning_rate": 2.514e-06, + "loss": 0.2208, + "step": 1260 + }, + { + "epoch": 0.12, + "learning_rate": 2.5240000000000003e-06, + "loss": 0.2248, + "step": 1265 + }, + { + "epoch": 0.12, + "learning_rate": 2.534e-06, + "loss": 0.2907, + "step": 1270 + }, + { + "epoch": 0.12, + "learning_rate": 2.544e-06, + "loss": 0.2172, + "step": 1275 + }, + { + "epoch": 0.13, + "learning_rate": 2.554e-06, + "loss": 0.2448, + "step": 1280 + }, + { + "epoch": 0.13, + "learning_rate": 2.564e-06, + "loss": 0.3114, + "step": 1285 + }, + { + "epoch": 0.13, + "learning_rate": 2.5740000000000003e-06, + "loss": 0.2575, + "step": 1290 + }, + { + "epoch": 0.13, + "learning_rate": 2.584e-06, + "loss": 0.2471, + "step": 1295 + }, + { + "epoch": 0.13, + "learning_rate": 2.594e-06, + "loss": 0.2595, + "step": 1300 + }, + { + "epoch": 0.13, + "learning_rate": 2.604e-06, + "loss": 0.3037, + "step": 1305 + }, + { + "epoch": 0.13, + "learning_rate": 2.614e-06, + "loss": 0.241, + "step": 1310 + }, + { + "epoch": 0.13, + "learning_rate": 2.624e-06, + "loss": 0.2491, + "step": 1315 + }, + { + "epoch": 0.13, + "learning_rate": 2.634e-06, + "loss": 0.2699, + "step": 1320 + }, + { + "epoch": 0.13, + "learning_rate": 2.644e-06, + "loss": 0.2376, + "step": 1325 + }, + { + "epoch": 0.13, + "learning_rate": 2.654e-06, + "loss": 0.2629, + "step": 1330 + }, + { + "epoch": 0.13, + "learning_rate": 2.6640000000000002e-06, + "loss": 0.2839, + "step": 1335 + }, + { + "epoch": 0.13, + "learning_rate": 2.6739999999999997e-06, + "loss": 0.235, + "step": 1340 + }, + { + "epoch": 0.13, + "learning_rate": 2.684e-06, + "loss": 0.2314, + "step": 1345 + }, + { + "epoch": 0.13, + "learning_rate": 2.6940000000000004e-06, + "loss": 0.2549, + "step": 1350 + }, + { + "epoch": 0.13, + "learning_rate": 2.704e-06, + "loss": 0.2582, + "step": 1355 + }, + { + "epoch": 0.13, + "learning_rate": 2.714e-06, + "loss": 0.224, + "step": 1360 + }, + { + "epoch": 0.13, + "learning_rate": 2.724e-06, + "loss": 0.2468, + "step": 1365 + }, + { + "epoch": 0.13, + "learning_rate": 2.734e-06, + "loss": 0.2717, + "step": 1370 + }, + { + "epoch": 0.13, + "learning_rate": 2.7440000000000003e-06, + "loss": 0.2405, + "step": 1375 + }, + { + "epoch": 0.13, + "learning_rate": 2.7540000000000002e-06, + "loss": 0.2611, + "step": 1380 + }, + { + "epoch": 0.14, + "learning_rate": 2.764e-06, + "loss": 0.2709, + "step": 1385 + }, + { + "epoch": 0.14, + "learning_rate": 2.774e-06, + "loss": 0.2402, + "step": 1390 + }, + { + "epoch": 0.14, + "learning_rate": 2.784e-06, + "loss": 0.2461, + "step": 1395 + }, + { + "epoch": 0.14, + "learning_rate": 2.794e-06, + "loss": 0.2729, + "step": 1400 + }, + { + "epoch": 0.14, + "learning_rate": 2.804e-06, + "loss": 0.2541, + "step": 1405 + }, + { + "epoch": 0.14, + "learning_rate": 2.814e-06, + "loss": 0.214, + "step": 1410 + }, + { + "epoch": 0.14, + "learning_rate": 2.824e-06, + "loss": 0.2706, + "step": 1415 + }, + { + "epoch": 0.14, + "learning_rate": 2.8340000000000003e-06, + "loss": 0.2737, + "step": 1420 + }, + { + "epoch": 0.14, + "learning_rate": 2.844e-06, + "loss": 0.2496, + "step": 1425 + }, + { + "epoch": 0.14, + "learning_rate": 2.854e-06, + "loss": 0.2342, + "step": 1430 + }, + { + "epoch": 0.14, + "learning_rate": 2.864e-06, + "loss": 0.2919, + "step": 1435 + }, + { + "epoch": 0.14, + "learning_rate": 2.874e-06, + "loss": 0.2376, + "step": 1440 + }, + { + "epoch": 0.14, + "learning_rate": 2.8840000000000003e-06, + "loss": 0.2364, + "step": 1445 + }, + { + "epoch": 0.14, + "learning_rate": 2.894e-06, + "loss": 0.2638, + "step": 1450 + }, + { + "epoch": 0.14, + "learning_rate": 2.904e-06, + "loss": 0.2783, + "step": 1455 + }, + { + "epoch": 0.14, + "learning_rate": 2.914e-06, + "loss": 0.2091, + "step": 1460 + }, + { + "epoch": 0.14, + "learning_rate": 2.924e-06, + "loss": 0.2424, + "step": 1465 + }, + { + "epoch": 0.14, + "learning_rate": 2.934e-06, + "loss": 0.2606, + "step": 1470 + }, + { + "epoch": 0.14, + "learning_rate": 2.944e-06, + "loss": 0.2399, + "step": 1475 + }, + { + "epoch": 0.14, + "learning_rate": 2.954e-06, + "loss": 0.232, + "step": 1480 + }, + { + "epoch": 0.15, + "learning_rate": 2.964e-06, + "loss": 0.2538, + "step": 1485 + }, + { + "epoch": 0.15, + "learning_rate": 2.9740000000000002e-06, + "loss": 0.2347, + "step": 1490 + }, + { + "epoch": 0.15, + "learning_rate": 2.9839999999999997e-06, + "loss": 0.2548, + "step": 1495 + }, + { + "epoch": 0.15, + "learning_rate": 2.994e-06, + "loss": 0.2527, + "step": 1500 + }, + { + "epoch": 0.15, + "eval_cer": 0.07988743753916448, + "eval_loss": 0.3998512327671051, + "eval_runtime": 272.2231, + "eval_samples_per_second": 60.135, + "eval_steps_per_second": 1.671, + "eval_wer": 0.21421808375178755, + "step": 1500 + }, + { + "epoch": 0.15, + "learning_rate": 3.0040000000000004e-06, + "loss": 0.2444, + "step": 1505 + }, + { + "epoch": 0.15, + "learning_rate": 3.014e-06, + "loss": 0.2232, + "step": 1510 + }, + { + "epoch": 0.15, + "learning_rate": 3.024e-06, + "loss": 0.2533, + "step": 1515 + }, + { + "epoch": 0.15, + "learning_rate": 3.034e-06, + "loss": 0.2584, + "step": 1520 + }, + { + "epoch": 0.15, + "learning_rate": 3.044e-06, + "loss": 0.2311, + "step": 1525 + }, + { + "epoch": 0.15, + "learning_rate": 3.0540000000000003e-06, + "loss": 0.2316, + "step": 1530 + }, + { + "epoch": 0.15, + "learning_rate": 3.0640000000000002e-06, + "loss": 0.2767, + "step": 1535 + }, + { + "epoch": 0.15, + "learning_rate": 3.074e-06, + "loss": 0.2421, + "step": 1540 + }, + { + "epoch": 0.15, + "learning_rate": 3.084e-06, + "loss": 0.2197, + "step": 1545 + }, + { + "epoch": 0.15, + "learning_rate": 3.094e-06, + "loss": 0.2471, + "step": 1550 + }, + { + "epoch": 0.15, + "learning_rate": 3.104e-06, + "loss": 0.2536, + "step": 1555 + }, + { + "epoch": 0.15, + "learning_rate": 3.114e-06, + "loss": 0.229, + "step": 1560 + }, + { + "epoch": 0.15, + "learning_rate": 3.124e-06, + "loss": 0.2383, + "step": 1565 + }, + { + "epoch": 0.15, + "learning_rate": 3.134e-06, + "loss": 0.2697, + "step": 1570 + }, + { + "epoch": 0.15, + "learning_rate": 3.1440000000000003e-06, + "loss": 0.2518, + "step": 1575 + }, + { + "epoch": 0.15, + "learning_rate": 3.1539999999999998e-06, + "loss": 0.2322, + "step": 1580 + }, + { + "epoch": 0.15, + "learning_rate": 3.164e-06, + "loss": 0.2755, + "step": 1585 + }, + { + "epoch": 0.16, + "learning_rate": 3.1740000000000004e-06, + "loss": 0.2353, + "step": 1590 + }, + { + "epoch": 0.16, + "learning_rate": 3.184e-06, + "loss": 0.2146, + "step": 1595 + }, + { + "epoch": 0.16, + "learning_rate": 3.1940000000000003e-06, + "loss": 0.2641, + "step": 1600 + }, + { + "epoch": 0.16, + "learning_rate": 3.204e-06, + "loss": 0.2361, + "step": 1605 + }, + { + "epoch": 0.16, + "learning_rate": 3.214e-06, + "loss": 0.212, + "step": 1610 + }, + { + "epoch": 0.16, + "learning_rate": 3.224e-06, + "loss": 0.252, + "step": 1615 + }, + { + "epoch": 0.16, + "learning_rate": 3.2340000000000003e-06, + "loss": 0.2948, + "step": 1620 + }, + { + "epoch": 0.16, + "learning_rate": 3.244e-06, + "loss": 0.2324, + "step": 1625 + }, + { + "epoch": 0.16, + "learning_rate": 3.254e-06, + "loss": 0.2259, + "step": 1630 + }, + { + "epoch": 0.16, + "learning_rate": 3.264e-06, + "loss": 0.2646, + "step": 1635 + }, + { + "epoch": 0.16, + "learning_rate": 3.274e-06, + "loss": 0.2208, + "step": 1640 + }, + { + "epoch": 0.16, + "learning_rate": 3.2840000000000002e-06, + "loss": 0.217, + "step": 1645 + }, + { + "epoch": 0.16, + "learning_rate": 3.2939999999999997e-06, + "loss": 0.2564, + "step": 1650 + }, + { + "epoch": 0.16, + "learning_rate": 3.304e-06, + "loss": 0.2538, + "step": 1655 + }, + { + "epoch": 0.16, + "learning_rate": 3.3140000000000004e-06, + "loss": 0.2309, + "step": 1660 + }, + { + "epoch": 0.16, + "learning_rate": 3.324e-06, + "loss": 0.2305, + "step": 1665 + }, + { + "epoch": 0.16, + "learning_rate": 3.334e-06, + "loss": 0.2475, + "step": 1670 + }, + { + "epoch": 0.16, + "learning_rate": 3.344e-06, + "loss": 0.1965, + "step": 1675 + }, + { + "epoch": 0.16, + "learning_rate": 3.354e-06, + "loss": 0.2382, + "step": 1680 + }, + { + "epoch": 0.16, + "learning_rate": 3.3640000000000003e-06, + "loss": 0.2604, + "step": 1685 + }, + { + "epoch": 0.17, + "learning_rate": 3.3740000000000002e-06, + "loss": 0.214, + "step": 1690 + }, + { + "epoch": 0.17, + "learning_rate": 3.384e-06, + "loss": 0.2296, + "step": 1695 + }, + { + "epoch": 0.17, + "learning_rate": 3.394e-06, + "loss": 0.2415, + "step": 1700 + }, + { + "epoch": 0.17, + "learning_rate": 3.404e-06, + "loss": 0.2599, + "step": 1705 + }, + { + "epoch": 0.17, + "learning_rate": 3.414e-06, + "loss": 0.225, + "step": 1710 + }, + { + "epoch": 0.17, + "learning_rate": 3.424e-06, + "loss": 0.2263, + "step": 1715 + }, + { + "epoch": 0.17, + "learning_rate": 3.434e-06, + "loss": 0.2415, + "step": 1720 + }, + { + "epoch": 0.17, + "learning_rate": 3.444e-06, + "loss": 0.2331, + "step": 1725 + }, + { + "epoch": 0.17, + "learning_rate": 3.4540000000000003e-06, + "loss": 0.2257, + "step": 1730 + }, + { + "epoch": 0.17, + "learning_rate": 3.4639999999999998e-06, + "loss": 0.3014, + "step": 1735 + }, + { + "epoch": 0.17, + "learning_rate": 3.474e-06, + "loss": 0.2326, + "step": 1740 + }, + { + "epoch": 0.17, + "learning_rate": 3.4840000000000004e-06, + "loss": 0.2342, + "step": 1745 + }, + { + "epoch": 0.17, + "learning_rate": 3.494e-06, + "loss": 0.2692, + "step": 1750 + }, + { + "epoch": 0.17, + "learning_rate": 3.5040000000000002e-06, + "loss": 0.253, + "step": 1755 + }, + { + "epoch": 0.17, + "learning_rate": 3.514e-06, + "loss": 0.2247, + "step": 1760 + }, + { + "epoch": 0.17, + "learning_rate": 3.524e-06, + "loss": 0.229, + "step": 1765 + }, + { + "epoch": 0.17, + "learning_rate": 3.534e-06, + "loss": 0.2588, + "step": 1770 + }, + { + "epoch": 0.17, + "learning_rate": 3.5440000000000003e-06, + "loss": 0.2151, + "step": 1775 + }, + { + "epoch": 0.17, + "learning_rate": 3.554e-06, + "loss": 0.2285, + "step": 1780 + }, + { + "epoch": 0.17, + "learning_rate": 3.564e-06, + "loss": 0.2791, + "step": 1785 + }, + { + "epoch": 0.18, + "learning_rate": 3.574e-06, + "loss": 0.2261, + "step": 1790 + }, + { + "epoch": 0.18, + "learning_rate": 3.584e-06, + "loss": 0.2128, + "step": 1795 + }, + { + "epoch": 0.18, + "learning_rate": 3.5940000000000002e-06, + "loss": 0.2496, + "step": 1800 + }, + { + "epoch": 0.18, + "learning_rate": 3.604e-06, + "loss": 0.2613, + "step": 1805 + }, + { + "epoch": 0.18, + "learning_rate": 3.614e-06, + "loss": 0.2231, + "step": 1810 + }, + { + "epoch": 0.18, + "learning_rate": 3.6240000000000004e-06, + "loss": 0.2332, + "step": 1815 + }, + { + "epoch": 0.18, + "learning_rate": 3.634e-06, + "loss": 0.2638, + "step": 1820 + }, + { + "epoch": 0.18, + "learning_rate": 3.644e-06, + "loss": 0.2512, + "step": 1825 + }, + { + "epoch": 0.18, + "learning_rate": 3.654e-06, + "loss": 0.25, + "step": 1830 + }, + { + "epoch": 0.18, + "learning_rate": 3.664e-06, + "loss": 0.2676, + "step": 1835 + }, + { + "epoch": 0.18, + "learning_rate": 3.6740000000000003e-06, + "loss": 0.2348, + "step": 1840 + }, + { + "epoch": 0.18, + "learning_rate": 3.6840000000000002e-06, + "loss": 0.22, + "step": 1845 + }, + { + "epoch": 0.18, + "learning_rate": 3.694e-06, + "loss": 0.2337, + "step": 1850 + }, + { + "epoch": 0.18, + "learning_rate": 3.704e-06, + "loss": 0.2159, + "step": 1855 + }, + { + "epoch": 0.18, + "learning_rate": 3.714e-06, + "loss": 0.2138, + "step": 1860 + }, + { + "epoch": 0.18, + "learning_rate": 3.724e-06, + "loss": 0.2568, + "step": 1865 + }, + { + "epoch": 0.18, + "learning_rate": 3.734e-06, + "loss": 0.2541, + "step": 1870 + }, + { + "epoch": 0.18, + "learning_rate": 3.744e-06, + "loss": 0.2142, + "step": 1875 + }, + { + "epoch": 0.18, + "learning_rate": 3.7540000000000004e-06, + "loss": 0.2228, + "step": 1880 + }, + { + "epoch": 0.18, + "learning_rate": 3.7640000000000003e-06, + "loss": 0.2607, + "step": 1885 + }, + { + "epoch": 0.18, + "learning_rate": 3.7739999999999998e-06, + "loss": 0.2303, + "step": 1890 + }, + { + "epoch": 0.19, + "learning_rate": 3.7839999999999997e-06, + "loss": 0.2286, + "step": 1895 + }, + { + "epoch": 0.19, + "learning_rate": 3.7940000000000004e-06, + "loss": 0.2515, + "step": 1900 + }, + { + "epoch": 0.19, + "learning_rate": 3.804e-06, + "loss": 0.2371, + "step": 1905 + }, + { + "epoch": 0.19, + "learning_rate": 3.814e-06, + "loss": 0.2188, + "step": 1910 + }, + { + "epoch": 0.19, + "learning_rate": 3.824e-06, + "loss": 0.222, + "step": 1915 + }, + { + "epoch": 0.19, + "learning_rate": 3.834e-06, + "loss": 0.2845, + "step": 1920 + }, + { + "epoch": 0.19, + "learning_rate": 3.844e-06, + "loss": 0.2234, + "step": 1925 + }, + { + "epoch": 0.19, + "learning_rate": 3.854000000000001e-06, + "loss": 0.2222, + "step": 1930 + }, + { + "epoch": 0.19, + "learning_rate": 3.864e-06, + "loss": 0.2729, + "step": 1935 + }, + { + "epoch": 0.19, + "learning_rate": 3.874e-06, + "loss": 0.2093, + "step": 1940 + }, + { + "epoch": 0.19, + "learning_rate": 3.884e-06, + "loss": 0.2121, + "step": 1945 + }, + { + "epoch": 0.19, + "learning_rate": 3.894e-06, + "loss": 0.256, + "step": 1950 + }, + { + "epoch": 0.19, + "learning_rate": 3.903999999999999e-06, + "loss": 0.2377, + "step": 1955 + }, + { + "epoch": 0.19, + "learning_rate": 3.914e-06, + "loss": 0.1932, + "step": 1960 + }, + { + "epoch": 0.19, + "learning_rate": 3.924e-06, + "loss": 0.2632, + "step": 1965 + }, + { + "epoch": 0.19, + "learning_rate": 3.934e-06, + "loss": 0.2552, + "step": 1970 + }, + { + "epoch": 0.19, + "learning_rate": 3.944000000000001e-06, + "loss": 0.211, + "step": 1975 + }, + { + "epoch": 0.19, + "learning_rate": 3.954e-06, + "loss": 0.2257, + "step": 1980 + }, + { + "epoch": 0.19, + "learning_rate": 3.964e-06, + "loss": 0.261, + "step": 1985 + }, + { + "epoch": 0.19, + "learning_rate": 3.974e-06, + "loss": 0.2248, + "step": 1990 + }, + { + "epoch": 0.2, + "learning_rate": 3.984e-06, + "loss": 0.219, + "step": 1995 + }, + { + "epoch": 0.2, + "learning_rate": 3.994e-06, + "loss": 0.269, + "step": 2000 + }, + { + "epoch": 0.2, + "eval_cer": 0.07679358847182817, + "eval_loss": 0.3763008415699005, + "eval_runtime": 270.4089, + "eval_samples_per_second": 60.538, + "eval_steps_per_second": 1.683, + "eval_wer": 0.20493917449703872, + "step": 2000 + }, + { + "epoch": 0.2, + "learning_rate": 4.004e-06, + "loss": 0.2553, + "step": 2005 + }, + { + "epoch": 0.2, + "learning_rate": 4.014e-06, + "loss": 0.2147, + "step": 2010 + }, + { + "epoch": 0.2, + "learning_rate": 4.024e-06, + "loss": 0.2378, + "step": 2015 + }, + { + "epoch": 0.2, + "learning_rate": 4.034000000000001e-06, + "loss": 0.22, + "step": 2020 + }, + { + "epoch": 0.2, + "learning_rate": 4.044000000000001e-06, + "loss": 0.2211, + "step": 2025 + }, + { + "epoch": 0.2, + "learning_rate": 4.054e-06, + "loss": 0.2114, + "step": 2030 + }, + { + "epoch": 0.2, + "learning_rate": 4.064e-06, + "loss": 0.2683, + "step": 2035 + }, + { + "epoch": 0.2, + "learning_rate": 4.074e-06, + "loss": 0.2408, + "step": 2040 + }, + { + "epoch": 0.2, + "learning_rate": 4.084e-06, + "loss": 0.205, + "step": 2045 + }, + { + "epoch": 0.2, + "learning_rate": 4.094e-06, + "loss": 0.2696, + "step": 2050 + }, + { + "epoch": 0.2, + "learning_rate": 4.104e-06, + "loss": 0.2309, + "step": 2055 + }, + { + "epoch": 0.2, + "learning_rate": 4.114e-06, + "loss": 0.2161, + "step": 2060 + }, + { + "epoch": 0.2, + "learning_rate": 4.124e-06, + "loss": 0.2054, + "step": 2065 + }, + { + "epoch": 0.2, + "learning_rate": 4.1340000000000006e-06, + "loss": 0.2332, + "step": 2070 + }, + { + "epoch": 0.2, + "learning_rate": 4.144e-06, + "loss": 0.2085, + "step": 2075 + }, + { + "epoch": 0.2, + "learning_rate": 4.1539999999999995e-06, + "loss": 0.21, + "step": 2080 + }, + { + "epoch": 0.2, + "learning_rate": 4.164e-06, + "loss": 0.265, + "step": 2085 + }, + { + "epoch": 0.2, + "learning_rate": 4.174e-06, + "loss": 0.209, + "step": 2090 + }, + { + "epoch": 0.2, + "learning_rate": 4.184e-06, + "loss": 0.2171, + "step": 2095 + }, + { + "epoch": 0.21, + "learning_rate": 4.194e-06, + "loss": 0.2387, + "step": 2100 + }, + { + "epoch": 0.21, + "learning_rate": 4.204e-06, + "loss": 0.246, + "step": 2105 + }, + { + "epoch": 0.21, + "learning_rate": 4.214e-06, + "loss": 0.2017, + "step": 2110 + }, + { + "epoch": 0.21, + "learning_rate": 4.2240000000000006e-06, + "loss": 0.2304, + "step": 2115 + }, + { + "epoch": 0.21, + "learning_rate": 4.2340000000000005e-06, + "loss": 0.258, + "step": 2120 + }, + { + "epoch": 0.21, + "learning_rate": 4.2439999999999995e-06, + "loss": 0.2308, + "step": 2125 + }, + { + "epoch": 0.21, + "learning_rate": 4.254e-06, + "loss": 0.2222, + "step": 2130 + }, + { + "epoch": 0.21, + "learning_rate": 4.264e-06, + "loss": 0.263, + "step": 2135 + }, + { + "epoch": 0.21, + "learning_rate": 4.274e-06, + "loss": 0.2156, + "step": 2140 + }, + { + "epoch": 0.21, + "learning_rate": 4.284000000000001e-06, + "loss": 0.2284, + "step": 2145 + }, + { + "epoch": 0.21, + "learning_rate": 4.294e-06, + "loss": 0.2206, + "step": 2150 + }, + { + "epoch": 0.21, + "learning_rate": 4.304e-06, + "loss": 0.2372, + "step": 2155 + }, + { + "epoch": 0.21, + "learning_rate": 4.3140000000000005e-06, + "loss": 0.2124, + "step": 2160 + }, + { + "epoch": 0.21, + "learning_rate": 4.3240000000000004e-06, + "loss": 0.243, + "step": 2165 + }, + { + "epoch": 0.21, + "learning_rate": 4.3339999999999995e-06, + "loss": 0.2586, + "step": 2170 + }, + { + "epoch": 0.21, + "learning_rate": 4.344e-06, + "loss": 0.2177, + "step": 2175 + }, + { + "epoch": 0.21, + "learning_rate": 4.354e-06, + "loss": 0.2097, + "step": 2180 + }, + { + "epoch": 0.21, + "learning_rate": 4.364e-06, + "loss": 0.2384, + "step": 2185 + }, + { + "epoch": 0.21, + "learning_rate": 4.374000000000001e-06, + "loss": 0.2153, + "step": 2190 + }, + { + "epoch": 0.21, + "learning_rate": 4.384e-06, + "loss": 0.2238, + "step": 2195 + }, + { + "epoch": 0.22, + "learning_rate": 4.394e-06, + "loss": 0.2418, + "step": 2200 + }, + { + "epoch": 0.22, + "learning_rate": 4.4040000000000005e-06, + "loss": 0.2383, + "step": 2205 + }, + { + "epoch": 0.22, + "learning_rate": 4.4140000000000004e-06, + "loss": 0.2093, + "step": 2210 + }, + { + "epoch": 0.22, + "learning_rate": 4.424e-06, + "loss": 0.2279, + "step": 2215 + }, + { + "epoch": 0.22, + "learning_rate": 4.433999999999999e-06, + "loss": 0.2802, + "step": 2220 + }, + { + "epoch": 0.22, + "learning_rate": 4.444e-06, + "loss": 0.2249, + "step": 2225 + }, + { + "epoch": 0.22, + "learning_rate": 4.454e-06, + "loss": 0.2067, + "step": 2230 + }, + { + "epoch": 0.22, + "learning_rate": 4.464e-06, + "loss": 0.2511, + "step": 2235 + }, + { + "epoch": 0.22, + "learning_rate": 4.474000000000001e-06, + "loss": 0.24, + "step": 2240 + }, + { + "epoch": 0.22, + "learning_rate": 4.484e-06, + "loss": 0.1975, + "step": 2245 + }, + { + "epoch": 0.22, + "learning_rate": 4.494e-06, + "loss": 0.2415, + "step": 2250 + }, + { + "epoch": 0.22, + "learning_rate": 4.504e-06, + "loss": 0.2479, + "step": 2255 + }, + { + "epoch": 0.22, + "learning_rate": 4.514e-06, + "loss": 0.2225, + "step": 2260 + }, + { + "epoch": 0.22, + "learning_rate": 4.524e-06, + "loss": 0.2198, + "step": 2265 + }, + { + "epoch": 0.22, + "learning_rate": 4.534e-06, + "loss": 0.2353, + "step": 2270 + }, + { + "epoch": 0.22, + "learning_rate": 4.544e-06, + "loss": 0.202, + "step": 2275 + }, + { + "epoch": 0.22, + "learning_rate": 4.554e-06, + "loss": 0.2242, + "step": 2280 + }, + { + "epoch": 0.22, + "learning_rate": 4.564000000000001e-06, + "loss": 0.2615, + "step": 2285 + }, + { + "epoch": 0.22, + "learning_rate": 4.574e-06, + "loss": 0.2367, + "step": 2290 + }, + { + "epoch": 0.22, + "learning_rate": 4.584e-06, + "loss": 0.2107, + "step": 2295 + }, + { + "epoch": 0.22, + "learning_rate": 4.594e-06, + "loss": 0.2411, + "step": 2300 + }, + { + "epoch": 0.23, + "learning_rate": 4.604e-06, + "loss": 0.2174, + "step": 2305 + }, + { + "epoch": 0.23, + "learning_rate": 4.614e-06, + "loss": 0.2216, + "step": 2310 + }, + { + "epoch": 0.23, + "learning_rate": 4.624e-06, + "loss": 0.2289, + "step": 2315 + }, + { + "epoch": 0.23, + "learning_rate": 4.634e-06, + "loss": 0.2688, + "step": 2320 + }, + { + "epoch": 0.23, + "learning_rate": 4.644e-06, + "loss": 0.2194, + "step": 2325 + }, + { + "epoch": 0.23, + "learning_rate": 4.654000000000001e-06, + "loss": 0.219, + "step": 2330 + }, + { + "epoch": 0.23, + "learning_rate": 4.664000000000001e-06, + "loss": 0.2276, + "step": 2335 + }, + { + "epoch": 0.23, + "learning_rate": 4.674e-06, + "loss": 0.2098, + "step": 2340 + }, + { + "epoch": 0.23, + "learning_rate": 4.684e-06, + "loss": 0.2005, + "step": 2345 + }, + { + "epoch": 0.23, + "learning_rate": 4.694e-06, + "loss": 0.256, + "step": 2350 + }, + { + "epoch": 0.23, + "learning_rate": 4.704e-06, + "loss": 0.2357, + "step": 2355 + }, + { + "epoch": 0.23, + "learning_rate": 4.714000000000001e-06, + "loss": 0.2168, + "step": 2360 + }, + { + "epoch": 0.23, + "learning_rate": 4.724e-06, + "loss": 0.2422, + "step": 2365 + }, + { + "epoch": 0.23, + "learning_rate": 4.734e-06, + "loss": 0.2586, + "step": 2370 + }, + { + "epoch": 0.23, + "learning_rate": 4.744e-06, + "loss": 0.2069, + "step": 2375 + }, + { + "epoch": 0.23, + "learning_rate": 4.7540000000000006e-06, + "loss": 0.2089, + "step": 2380 + }, + { + "epoch": 0.23, + "learning_rate": 4.764e-06, + "loss": 0.2373, + "step": 2385 + }, + { + "epoch": 0.23, + "learning_rate": 4.7739999999999995e-06, + "loss": 0.2212, + "step": 2390 + }, + { + "epoch": 0.23, + "learning_rate": 4.784e-06, + "loss": 0.2117, + "step": 2395 + }, + { + "epoch": 0.23, + "learning_rate": 4.794e-06, + "loss": 0.2356, + "step": 2400 + }, + { + "epoch": 0.24, + "learning_rate": 4.804e-06, + "loss": 0.2208, + "step": 2405 + }, + { + "epoch": 0.24, + "learning_rate": 4.814e-06, + "loss": 0.2098, + "step": 2410 + }, + { + "epoch": 0.24, + "learning_rate": 4.824e-06, + "loss": 0.2315, + "step": 2415 + }, + { + "epoch": 0.24, + "learning_rate": 4.834e-06, + "loss": 0.2311, + "step": 2420 + }, + { + "epoch": 0.24, + "learning_rate": 4.8440000000000005e-06, + "loss": 0.1969, + "step": 2425 + }, + { + "epoch": 0.24, + "learning_rate": 4.8540000000000005e-06, + "loss": 0.2427, + "step": 2430 + }, + { + "epoch": 0.24, + "learning_rate": 4.8639999999999995e-06, + "loss": 0.2593, + "step": 2435 + }, + { + "epoch": 0.24, + "learning_rate": 4.874e-06, + "loss": 0.2154, + "step": 2440 + }, + { + "epoch": 0.24, + "learning_rate": 4.884e-06, + "loss": 0.213, + "step": 2445 + }, + { + "epoch": 0.24, + "learning_rate": 4.894e-06, + "loss": 0.2339, + "step": 2450 + }, + { + "epoch": 0.24, + "learning_rate": 4.904000000000001e-06, + "loss": 0.2395, + "step": 2455 + }, + { + "epoch": 0.24, + "learning_rate": 4.914e-06, + "loss": 0.2067, + "step": 2460 + }, + { + "epoch": 0.24, + "learning_rate": 4.924e-06, + "loss": 0.2346, + "step": 2465 + }, + { + "epoch": 0.24, + "learning_rate": 4.9340000000000005e-06, + "loss": 0.2563, + "step": 2470 + }, + { + "epoch": 0.24, + "learning_rate": 4.9440000000000004e-06, + "loss": 0.2143, + "step": 2475 + }, + { + "epoch": 0.24, + "learning_rate": 4.954e-06, + "loss": 0.2207, + "step": 2480 + }, + { + "epoch": 0.24, + "learning_rate": 4.964e-06, + "loss": 0.2644, + "step": 2485 + }, + { + "epoch": 0.24, + "learning_rate": 4.974e-06, + "loss": 0.1964, + "step": 2490 + }, + { + "epoch": 0.24, + "learning_rate": 4.984e-06, + "loss": 0.2185, + "step": 2495 + }, + { + "epoch": 0.24, + "learning_rate": 4.994000000000001e-06, + "loss": 0.229, + "step": 2500 + }, + { + "epoch": 0.24, + "eval_cer": 0.07526400614145226, + "eval_loss": 0.3628905713558197, + "eval_runtime": 274.2027, + "eval_samples_per_second": 59.7, + "eval_steps_per_second": 1.659, + "eval_wer": 0.20293451218795505, + "step": 2500 + }, + { + "epoch": 0.24, + "learning_rate": 5.004e-06, + "loss": 0.1989, + "step": 2505 + }, + { + "epoch": 0.25, + "learning_rate": 5.014e-06, + "loss": 0.221, + "step": 2510 + }, + { + "epoch": 0.25, + "learning_rate": 5.0240000000000005e-06, + "loss": 0.2216, + "step": 2515 + }, + { + "epoch": 0.25, + "learning_rate": 5.034e-06, + "loss": 0.2244, + "step": 2520 + }, + { + "epoch": 0.25, + "learning_rate": 5.044e-06, + "loss": 0.179, + "step": 2525 + }, + { + "epoch": 0.25, + "learning_rate": 5.053999999999999e-06, + "loss": 0.2024, + "step": 2530 + }, + { + "epoch": 0.25, + "learning_rate": 5.064e-06, + "loss": 0.2544, + "step": 2535 + }, + { + "epoch": 0.25, + "learning_rate": 5.074e-06, + "loss": 0.2397, + "step": 2540 + }, + { + "epoch": 0.25, + "learning_rate": 5.084e-06, + "loss": 0.2013, + "step": 2545 + }, + { + "epoch": 0.25, + "learning_rate": 5.094000000000001e-06, + "loss": 0.2358, + "step": 2550 + }, + { + "epoch": 0.25, + "learning_rate": 5.104e-06, + "loss": 0.2452, + "step": 2555 + }, + { + "epoch": 0.25, + "learning_rate": 5.114e-06, + "loss": 0.2163, + "step": 2560 + }, + { + "epoch": 0.25, + "learning_rate": 5.124e-06, + "loss": 0.2157, + "step": 2565 + }, + { + "epoch": 0.25, + "learning_rate": 5.134e-06, + "loss": 0.2513, + "step": 2570 + }, + { + "epoch": 0.25, + "learning_rate": 5.144e-06, + "loss": 0.2179, + "step": 2575 + }, + { + "epoch": 0.25, + "learning_rate": 5.154e-06, + "loss": 0.2067, + "step": 2580 + }, + { + "epoch": 0.25, + "learning_rate": 5.164e-06, + "loss": 0.231, + "step": 2585 + }, + { + "epoch": 0.25, + "learning_rate": 5.174e-06, + "loss": 0.2137, + "step": 2590 + }, + { + "epoch": 0.25, + "learning_rate": 5.184000000000001e-06, + "loss": 0.2077, + "step": 2595 + }, + { + "epoch": 0.25, + "learning_rate": 5.194e-06, + "loss": 0.2502, + "step": 2600 + }, + { + "epoch": 0.25, + "learning_rate": 5.204e-06, + "loss": 0.2372, + "step": 2605 + }, + { + "epoch": 0.26, + "learning_rate": 5.214e-06, + "loss": 0.2082, + "step": 2610 + }, + { + "epoch": 0.26, + "learning_rate": 5.224e-06, + "loss": 0.2338, + "step": 2615 + }, + { + "epoch": 0.26, + "learning_rate": 5.234e-06, + "loss": 0.2754, + "step": 2620 + }, + { + "epoch": 0.26, + "learning_rate": 5.244e-06, + "loss": 0.206, + "step": 2625 + }, + { + "epoch": 0.26, + "learning_rate": 5.254e-06, + "loss": 0.2147, + "step": 2630 + }, + { + "epoch": 0.26, + "learning_rate": 5.264e-06, + "loss": 0.2449, + "step": 2635 + }, + { + "epoch": 0.26, + "learning_rate": 5.274000000000001e-06, + "loss": 0.211, + "step": 2640 + }, + { + "epoch": 0.26, + "learning_rate": 5.2840000000000006e-06, + "loss": 0.2083, + "step": 2645 + }, + { + "epoch": 0.26, + "learning_rate": 5.294e-06, + "loss": 0.243, + "step": 2650 + }, + { + "epoch": 0.26, + "learning_rate": 5.304e-06, + "loss": 0.2393, + "step": 2655 + }, + { + "epoch": 0.26, + "learning_rate": 5.314e-06, + "loss": 0.2083, + "step": 2660 + }, + { + "epoch": 0.26, + "learning_rate": 5.324e-06, + "loss": 0.2225, + "step": 2665 + }, + { + "epoch": 0.26, + "learning_rate": 5.334000000000001e-06, + "loss": 0.2493, + "step": 2670 + }, + { + "epoch": 0.26, + "learning_rate": 5.344e-06, + "loss": 0.204, + "step": 2675 + }, + { + "epoch": 0.26, + "learning_rate": 5.354e-06, + "loss": 0.2223, + "step": 2680 + }, + { + "epoch": 0.26, + "learning_rate": 5.364e-06, + "loss": 0.2541, + "step": 2685 + }, + { + "epoch": 0.26, + "learning_rate": 5.3740000000000006e-06, + "loss": 0.1936, + "step": 2690 + }, + { + "epoch": 0.26, + "learning_rate": 5.384e-06, + "loss": 0.2057, + "step": 2695 + }, + { + "epoch": 0.26, + "learning_rate": 5.3939999999999995e-06, + "loss": 0.2398, + "step": 2700 + }, + { + "epoch": 0.26, + "learning_rate": 5.404e-06, + "loss": 0.2253, + "step": 2705 + }, + { + "epoch": 0.26, + "learning_rate": 5.414e-06, + "loss": 0.2034, + "step": 2710 + }, + { + "epoch": 0.27, + "learning_rate": 5.424e-06, + "loss": 0.2133, + "step": 2715 + }, + { + "epoch": 0.27, + "learning_rate": 5.434e-06, + "loss": 0.2581, + "step": 2720 + }, + { + "epoch": 0.27, + "learning_rate": 5.444e-06, + "loss": 0.2405, + "step": 2725 + }, + { + "epoch": 0.27, + "learning_rate": 5.454e-06, + "loss": 0.1884, + "step": 2730 + }, + { + "epoch": 0.27, + "learning_rate": 5.4640000000000005e-06, + "loss": 0.2465, + "step": 2735 + }, + { + "epoch": 0.27, + "learning_rate": 5.4740000000000004e-06, + "loss": 0.2263, + "step": 2740 + }, + { + "epoch": 0.27, + "learning_rate": 5.4839999999999995e-06, + "loss": 0.189, + "step": 2745 + }, + { + "epoch": 0.27, + "learning_rate": 5.494e-06, + "loss": 0.2557, + "step": 2750 + }, + { + "epoch": 0.27, + "learning_rate": 5.504e-06, + "loss": 0.2382, + "step": 2755 + }, + { + "epoch": 0.27, + "learning_rate": 5.514e-06, + "loss": 0.206, + "step": 2760 + }, + { + "epoch": 0.27, + "learning_rate": 5.524000000000001e-06, + "loss": 0.1949, + "step": 2765 + }, + { + "epoch": 0.27, + "learning_rate": 5.534e-06, + "loss": 0.2667, + "step": 2770 + }, + { + "epoch": 0.27, + "learning_rate": 5.544e-06, + "loss": 0.1868, + "step": 2775 + }, + { + "epoch": 0.27, + "learning_rate": 5.5540000000000005e-06, + "loss": 0.2142, + "step": 2780 + }, + { + "epoch": 0.27, + "learning_rate": 5.5640000000000004e-06, + "loss": 0.2199, + "step": 2785 + }, + { + "epoch": 0.27, + "learning_rate": 5.574e-06, + "loss": 0.2174, + "step": 2790 + }, + { + "epoch": 0.27, + "learning_rate": 5.584e-06, + "loss": 0.2079, + "step": 2795 + }, + { + "epoch": 0.27, + "learning_rate": 5.594e-06, + "loss": 0.2373, + "step": 2800 + }, + { + "epoch": 0.27, + "learning_rate": 5.604e-06, + "loss": 0.2228, + "step": 2805 + }, + { + "epoch": 0.27, + "learning_rate": 5.614000000000001e-06, + "loss": 0.1799, + "step": 2810 + }, + { + "epoch": 0.28, + "learning_rate": 5.624e-06, + "loss": 0.2236, + "step": 2815 + }, + { + "epoch": 0.28, + "learning_rate": 5.634e-06, + "loss": 0.2459, + "step": 2820 + }, + { + "epoch": 0.28, + "learning_rate": 5.6440000000000005e-06, + "loss": 0.2211, + "step": 2825 + }, + { + "epoch": 0.28, + "learning_rate": 5.654e-06, + "loss": 0.2035, + "step": 2830 + }, + { + "epoch": 0.28, + "learning_rate": 5.664e-06, + "loss": 0.2411, + "step": 2835 + }, + { + "epoch": 0.28, + "learning_rate": 5.673999999999999e-06, + "loss": 0.2006, + "step": 2840 + }, + { + "epoch": 0.28, + "learning_rate": 5.684e-06, + "loss": 0.2165, + "step": 2845 + }, + { + "epoch": 0.28, + "learning_rate": 5.694e-06, + "loss": 0.2204, + "step": 2850 + }, + { + "epoch": 0.28, + "learning_rate": 5.704e-06, + "loss": 0.2325, + "step": 2855 + }, + { + "epoch": 0.28, + "learning_rate": 5.714000000000001e-06, + "loss": 0.1969, + "step": 2860 + }, + { + "epoch": 0.28, + "learning_rate": 5.724e-06, + "loss": 0.2126, + "step": 2865 + }, + { + "epoch": 0.28, + "learning_rate": 5.734e-06, + "loss": 0.2557, + "step": 2870 + }, + { + "epoch": 0.28, + "learning_rate": 5.744e-06, + "loss": 0.1997, + "step": 2875 + }, + { + "epoch": 0.28, + "learning_rate": 5.754e-06, + "loss": 0.2065, + "step": 2880 + }, + { + "epoch": 0.28, + "learning_rate": 5.764e-06, + "loss": 0.2608, + "step": 2885 + }, + { + "epoch": 0.28, + "learning_rate": 5.774e-06, + "loss": 0.2147, + "step": 2890 + }, + { + "epoch": 0.28, + "learning_rate": 5.784e-06, + "loss": 0.2126, + "step": 2895 + }, + { + "epoch": 0.28, + "learning_rate": 5.794e-06, + "loss": 0.2239, + "step": 2900 + }, + { + "epoch": 0.28, + "learning_rate": 5.804000000000001e-06, + "loss": 0.2211, + "step": 2905 + }, + { + "epoch": 0.28, + "learning_rate": 5.814e-06, + "loss": 0.1993, + "step": 2910 + }, + { + "epoch": 0.29, + "learning_rate": 5.824e-06, + "loss": 0.22, + "step": 2915 + }, + { + "epoch": 0.29, + "learning_rate": 5.834e-06, + "loss": 0.2157, + "step": 2920 + }, + { + "epoch": 0.29, + "learning_rate": 5.844e-06, + "loss": 0.209, + "step": 2925 + }, + { + "epoch": 0.29, + "learning_rate": 5.854e-06, + "loss": 0.1959, + "step": 2930 + }, + { + "epoch": 0.29, + "learning_rate": 5.864e-06, + "loss": 0.2407, + "step": 2935 + }, + { + "epoch": 0.29, + "learning_rate": 5.874e-06, + "loss": 0.2259, + "step": 2940 + }, + { + "epoch": 0.29, + "learning_rate": 5.884e-06, + "loss": 0.2067, + "step": 2945 + }, + { + "epoch": 0.29, + "learning_rate": 5.894000000000001e-06, + "loss": 0.2396, + "step": 2950 + }, + { + "epoch": 0.29, + "learning_rate": 5.9040000000000006e-06, + "loss": 0.231, + "step": 2955 + }, + { + "epoch": 0.29, + "learning_rate": 5.914e-06, + "loss": 0.1802, + "step": 2960 + }, + { + "epoch": 0.29, + "learning_rate": 5.924e-06, + "loss": 0.2068, + "step": 2965 + }, + { + "epoch": 0.29, + "learning_rate": 5.934e-06, + "loss": 0.2374, + "step": 2970 + }, + { + "epoch": 0.29, + "learning_rate": 5.944e-06, + "loss": 0.1827, + "step": 2975 + }, + { + "epoch": 0.29, + "learning_rate": 5.954000000000001e-06, + "loss": 0.1962, + "step": 2980 + }, + { + "epoch": 0.29, + "learning_rate": 5.964e-06, + "loss": 0.2401, + "step": 2985 + }, + { + "epoch": 0.29, + "learning_rate": 5.974e-06, + "loss": 0.1983, + "step": 2990 + }, + { + "epoch": 0.29, + "learning_rate": 5.984e-06, + "loss": 0.1909, + "step": 2995 + }, + { + "epoch": 0.29, + "learning_rate": 5.9940000000000005e-06, + "loss": 0.2286, + "step": 3000 + }, + { + "epoch": 0.29, + "eval_cer": 0.07327427735038881, + "eval_loss": 0.34942591190338135, + "eval_runtime": 272.0894, + "eval_samples_per_second": 60.164, + "eval_steps_per_second": 1.672, + "eval_wer": 0.19718824889155886, + "step": 3000 + }, + { + "epoch": 0.29, + "learning_rate": 6.0040000000000005e-06, + "loss": 0.2016, + "step": 3005 + }, + { + "epoch": 0.29, + "learning_rate": 6.0139999999999995e-06, + "loss": 0.1782, + "step": 3010 + }, + { + "epoch": 0.29, + "learning_rate": 6.024e-06, + "loss": 0.2133, + "step": 3015 + }, + { + "epoch": 0.3, + "learning_rate": 6.034e-06, + "loss": 0.2593, + "step": 3020 + }, + { + "epoch": 0.3, + "learning_rate": 6.044e-06, + "loss": 0.188, + "step": 3025 + }, + { + "epoch": 0.3, + "learning_rate": 6.054e-06, + "loss": 0.2057, + "step": 3030 + }, + { + "epoch": 0.3, + "learning_rate": 6.064e-06, + "loss": 0.2331, + "step": 3035 + }, + { + "epoch": 0.3, + "learning_rate": 6.074e-06, + "loss": 0.2196, + "step": 3040 + }, + { + "epoch": 0.3, + "learning_rate": 6.0840000000000005e-06, + "loss": 0.1816, + "step": 3045 + }, + { + "epoch": 0.3, + "learning_rate": 6.0940000000000004e-06, + "loss": 0.2305, + "step": 3050 + }, + { + "epoch": 0.3, + "learning_rate": 6.1039999999999995e-06, + "loss": 0.219, + "step": 3055 + }, + { + "epoch": 0.3, + "learning_rate": 6.114e-06, + "loss": 0.2141, + "step": 3060 + }, + { + "epoch": 0.3, + "learning_rate": 6.124e-06, + "loss": 0.2103, + "step": 3065 + }, + { + "epoch": 0.3, + "learning_rate": 6.134e-06, + "loss": 0.2264, + "step": 3070 + }, + { + "epoch": 0.3, + "learning_rate": 6.144000000000001e-06, + "loss": 0.1864, + "step": 3075 + }, + { + "epoch": 0.3, + "learning_rate": 6.154e-06, + "loss": 0.2255, + "step": 3080 + }, + { + "epoch": 0.3, + "learning_rate": 6.164e-06, + "loss": 0.2563, + "step": 3085 + }, + { + "epoch": 0.3, + "learning_rate": 6.1740000000000005e-06, + "loss": 0.2055, + "step": 3090 + }, + { + "epoch": 0.3, + "learning_rate": 6.184e-06, + "loss": 0.197, + "step": 3095 + }, + { + "epoch": 0.3, + "learning_rate": 6.194e-06, + "loss": 0.2092, + "step": 3100 + }, + { + "epoch": 0.3, + "learning_rate": 6.204e-06, + "loss": 0.2316, + "step": 3105 + }, + { + "epoch": 0.3, + "learning_rate": 6.214e-06, + "loss": 0.179, + "step": 3110 + }, + { + "epoch": 0.3, + "learning_rate": 6.224e-06, + "loss": 0.2116, + "step": 3115 + }, + { + "epoch": 0.31, + "learning_rate": 6.234000000000001e-06, + "loss": 0.223, + "step": 3120 + }, + { + "epoch": 0.31, + "learning_rate": 6.244e-06, + "loss": 0.1834, + "step": 3125 + }, + { + "epoch": 0.31, + "learning_rate": 6.254e-06, + "loss": 0.1982, + "step": 3130 + }, + { + "epoch": 0.31, + "learning_rate": 6.2640000000000005e-06, + "loss": 0.2429, + "step": 3135 + }, + { + "epoch": 0.31, + "learning_rate": 6.274e-06, + "loss": 0.2019, + "step": 3140 + }, + { + "epoch": 0.31, + "learning_rate": 6.284e-06, + "loss": 0.187, + "step": 3145 + }, + { + "epoch": 0.31, + "learning_rate": 6.293999999999999e-06, + "loss": 0.2037, + "step": 3150 + }, + { + "epoch": 0.31, + "learning_rate": 6.304e-06, + "loss": 0.2237, + "step": 3155 + }, + { + "epoch": 0.31, + "learning_rate": 6.314e-06, + "loss": 0.1933, + "step": 3160 + }, + { + "epoch": 0.31, + "learning_rate": 6.324e-06, + "loss": 0.1932, + "step": 3165 + }, + { + "epoch": 0.31, + "learning_rate": 6.334000000000001e-06, + "loss": 0.2279, + "step": 3170 + }, + { + "epoch": 0.31, + "learning_rate": 6.344e-06, + "loss": 0.1916, + "step": 3175 + }, + { + "epoch": 0.31, + "learning_rate": 6.354e-06, + "loss": 0.2116, + "step": 3180 + }, + { + "epoch": 0.31, + "learning_rate": 6.364e-06, + "loss": 0.2315, + "step": 3185 + }, + { + "epoch": 0.31, + "learning_rate": 6.374e-06, + "loss": 0.2106, + "step": 3190 + }, + { + "epoch": 0.31, + "learning_rate": 6.384e-06, + "loss": 0.1785, + "step": 3195 + }, + { + "epoch": 0.31, + "learning_rate": 6.394e-06, + "loss": 0.2074, + "step": 3200 + }, + { + "epoch": 0.31, + "learning_rate": 6.404e-06, + "loss": 0.2332, + "step": 3205 + }, + { + "epoch": 0.31, + "learning_rate": 6.414e-06, + "loss": 0.1871, + "step": 3210 + }, + { + "epoch": 0.31, + "learning_rate": 6.424000000000001e-06, + "loss": 0.2048, + "step": 3215 + }, + { + "epoch": 0.31, + "learning_rate": 6.4340000000000006e-06, + "loss": 0.241, + "step": 3220 + }, + { + "epoch": 0.32, + "learning_rate": 6.444e-06, + "loss": 0.2013, + "step": 3225 + }, + { + "epoch": 0.32, + "learning_rate": 6.454e-06, + "loss": 0.202, + "step": 3230 + }, + { + "epoch": 0.32, + "learning_rate": 6.464e-06, + "loss": 0.248, + "step": 3235 + }, + { + "epoch": 0.32, + "learning_rate": 6.474e-06, + "loss": 0.1813, + "step": 3240 + }, + { + "epoch": 0.32, + "learning_rate": 6.484e-06, + "loss": 0.2019, + "step": 3245 + }, + { + "epoch": 0.32, + "learning_rate": 6.494e-06, + "loss": 0.2419, + "step": 3250 + }, + { + "epoch": 0.32, + "learning_rate": 6.504e-06, + "loss": 0.2155, + "step": 3255 + }, + { + "epoch": 0.32, + "learning_rate": 6.514000000000001e-06, + "loss": 0.1952, + "step": 3260 + }, + { + "epoch": 0.32, + "learning_rate": 6.5240000000000006e-06, + "loss": 0.2037, + "step": 3265 + }, + { + "epoch": 0.32, + "learning_rate": 6.534e-06, + "loss": 0.2466, + "step": 3270 + }, + { + "epoch": 0.32, + "learning_rate": 6.544e-06, + "loss": 0.1991, + "step": 3275 + }, + { + "epoch": 0.32, + "learning_rate": 6.554e-06, + "loss": 0.1918, + "step": 3280 + }, + { + "epoch": 0.32, + "learning_rate": 6.564e-06, + "loss": 0.2362, + "step": 3285 + }, + { + "epoch": 0.32, + "learning_rate": 6.574000000000001e-06, + "loss": 0.2018, + "step": 3290 + }, + { + "epoch": 0.32, + "learning_rate": 6.584e-06, + "loss": 0.2038, + "step": 3295 + }, + { + "epoch": 0.32, + "learning_rate": 6.594e-06, + "loss": 0.2573, + "step": 3300 + }, + { + "epoch": 0.32, + "learning_rate": 6.604e-06, + "loss": 0.2086, + "step": 3305 + }, + { + "epoch": 0.32, + "learning_rate": 6.6140000000000005e-06, + "loss": 0.1931, + "step": 3310 + }, + { + "epoch": 0.32, + "learning_rate": 6.6240000000000004e-06, + "loss": 0.1944, + "step": 3315 + }, + { + "epoch": 0.32, + "learning_rate": 6.6339999999999995e-06, + "loss": 0.2457, + "step": 3320 + }, + { + "epoch": 0.33, + "learning_rate": 6.644e-06, + "loss": 0.1999, + "step": 3325 + }, + { + "epoch": 0.33, + "learning_rate": 6.654e-06, + "loss": 0.2078, + "step": 3330 + }, + { + "epoch": 0.33, + "learning_rate": 6.664e-06, + "loss": 0.2416, + "step": 3335 + }, + { + "epoch": 0.33, + "learning_rate": 6.674e-06, + "loss": 0.1901, + "step": 3340 + }, + { + "epoch": 0.33, + "learning_rate": 6.684e-06, + "loss": 0.1892, + "step": 3345 + }, + { + "epoch": 0.33, + "learning_rate": 6.694e-06, + "loss": 0.2156, + "step": 3350 + }, + { + "epoch": 0.33, + "learning_rate": 6.7040000000000005e-06, + "loss": 0.2149, + "step": 3355 + }, + { + "epoch": 0.33, + "learning_rate": 6.7140000000000004e-06, + "loss": 0.1848, + "step": 3360 + }, + { + "epoch": 0.33, + "learning_rate": 6.7239999999999995e-06, + "loss": 0.2062, + "step": 3365 + }, + { + "epoch": 0.33, + "learning_rate": 6.734e-06, + "loss": 0.2213, + "step": 3370 + }, + { + "epoch": 0.33, + "learning_rate": 6.744e-06, + "loss": 0.1812, + "step": 3375 + }, + { + "epoch": 0.33, + "learning_rate": 6.754e-06, + "loss": 0.212, + "step": 3380 + }, + { + "epoch": 0.33, + "learning_rate": 6.764000000000001e-06, + "loss": 0.2501, + "step": 3385 + }, + { + "epoch": 0.33, + "learning_rate": 6.774e-06, + "loss": 0.1966, + "step": 3390 + }, + { + "epoch": 0.33, + "learning_rate": 6.784e-06, + "loss": 0.1847, + "step": 3395 + }, + { + "epoch": 0.33, + "learning_rate": 6.7940000000000005e-06, + "loss": 0.1979, + "step": 3400 + }, + { + "epoch": 0.33, + "learning_rate": 6.804e-06, + "loss": 0.2243, + "step": 3405 + }, + { + "epoch": 0.33, + "learning_rate": 6.814e-06, + "loss": 0.2047, + "step": 3410 + }, + { + "epoch": 0.33, + "learning_rate": 6.824e-06, + "loss": 0.2097, + "step": 3415 + }, + { + "epoch": 0.33, + "learning_rate": 6.834e-06, + "loss": 0.1987, + "step": 3420 + }, + { + "epoch": 0.33, + "learning_rate": 6.844e-06, + "loss": 0.1835, + "step": 3425 + }, + { + "epoch": 0.34, + "learning_rate": 6.854000000000001e-06, + "loss": 0.1805, + "step": 3430 + }, + { + "epoch": 0.34, + "learning_rate": 6.864000000000001e-06, + "loss": 0.245, + "step": 3435 + }, + { + "epoch": 0.34, + "learning_rate": 6.874e-06, + "loss": 0.2142, + "step": 3440 + }, + { + "epoch": 0.34, + "learning_rate": 6.8840000000000005e-06, + "loss": 0.1742, + "step": 3445 + }, + { + "epoch": 0.34, + "learning_rate": 6.894e-06, + "loss": 0.2212, + "step": 3450 + }, + { + "epoch": 0.34, + "learning_rate": 6.904e-06, + "loss": 0.238, + "step": 3455 + }, + { + "epoch": 0.34, + "learning_rate": 6.913999999999999e-06, + "loss": 0.2041, + "step": 3460 + }, + { + "epoch": 0.34, + "learning_rate": 6.924e-06, + "loss": 0.2107, + "step": 3465 + }, + { + "epoch": 0.34, + "learning_rate": 6.934e-06, + "loss": 0.2204, + "step": 3470 + }, + { + "epoch": 0.34, + "learning_rate": 6.944e-06, + "loss": 0.1821, + "step": 3475 + }, + { + "epoch": 0.34, + "learning_rate": 6.954000000000001e-06, + "loss": 0.1971, + "step": 3480 + }, + { + "epoch": 0.34, + "learning_rate": 6.964e-06, + "loss": 0.2494, + "step": 3485 + }, + { + "epoch": 0.34, + "learning_rate": 6.974e-06, + "loss": 0.1793, + "step": 3490 + }, + { + "epoch": 0.34, + "learning_rate": 6.984e-06, + "loss": 0.2012, + "step": 3495 + }, + { + "epoch": 0.34, + "learning_rate": 6.994e-06, + "loss": 0.2422, + "step": 3500 + }, + { + "epoch": 0.34, + "eval_cer": 0.07202795100711955, + "eval_loss": 0.3364557921886444, + "eval_runtime": 275.4062, + "eval_samples_per_second": 59.439, + "eval_steps_per_second": 1.652, + "eval_wer": 0.19293732002115668, + "step": 3500 + }, + { + "epoch": 0.34, + "learning_rate": 7.004e-06, + "loss": 0.2237, + "step": 3505 + }, + { + "epoch": 0.34, + "learning_rate": 7.014e-06, + "loss": 0.1966, + "step": 3510 + }, + { + "epoch": 0.34, + "learning_rate": 7.024e-06, + "loss": 0.1869, + "step": 3515 + }, + { + "epoch": 0.34, + "learning_rate": 7.034e-06, + "loss": 0.2335, + "step": 3520 + }, + { + "epoch": 0.34, + "learning_rate": 7.044000000000001e-06, + "loss": 0.201, + "step": 3525 + }, + { + "epoch": 0.35, + "learning_rate": 7.0540000000000006e-06, + "loss": 0.2007, + "step": 3530 + }, + { + "epoch": 0.35, + "learning_rate": 7.064e-06, + "loss": 0.2425, + "step": 3535 + }, + { + "epoch": 0.35, + "learning_rate": 7.074e-06, + "loss": 0.1834, + "step": 3540 + }, + { + "epoch": 0.35, + "learning_rate": 7.084e-06, + "loss": 0.1916, + "step": 3545 + }, + { + "epoch": 0.35, + "learning_rate": 7.094e-06, + "loss": 0.2178, + "step": 3550 + }, + { + "epoch": 0.35, + "learning_rate": 7.104e-06, + "loss": 0.2267, + "step": 3555 + }, + { + "epoch": 0.35, + "learning_rate": 7.114e-06, + "loss": 0.1861, + "step": 3560 + }, + { + "epoch": 0.35, + "learning_rate": 7.124e-06, + "loss": 0.21, + "step": 3565 + }, + { + "epoch": 0.35, + "learning_rate": 7.134000000000001e-06, + "loss": 0.2495, + "step": 3570 + }, + { + "epoch": 0.35, + "learning_rate": 7.1440000000000005e-06, + "loss": 0.2191, + "step": 3575 + }, + { + "epoch": 0.35, + "learning_rate": 7.154e-06, + "loss": 0.1731, + "step": 3580 + }, + { + "epoch": 0.35, + "learning_rate": 7.164e-06, + "loss": 0.2486, + "step": 3585 + }, + { + "epoch": 0.35, + "learning_rate": 7.174e-06, + "loss": 0.1928, + "step": 3590 + }, + { + "epoch": 0.35, + "learning_rate": 7.184e-06, + "loss": 0.1868, + "step": 3595 + }, + { + "epoch": 0.35, + "learning_rate": 7.194000000000001e-06, + "loss": 0.2581, + "step": 3600 + }, + { + "epoch": 0.35, + "learning_rate": 7.204e-06, + "loss": 0.2182, + "step": 3605 + }, + { + "epoch": 0.35, + "learning_rate": 7.214e-06, + "loss": 0.2029, + "step": 3610 + }, + { + "epoch": 0.35, + "learning_rate": 7.224e-06, + "loss": 0.2022, + "step": 3615 + }, + { + "epoch": 0.35, + "learning_rate": 7.2340000000000005e-06, + "loss": 0.2441, + "step": 3620 + }, + { + "epoch": 0.35, + "learning_rate": 7.2440000000000004e-06, + "loss": 0.1903, + "step": 3625 + }, + { + "epoch": 0.35, + "learning_rate": 7.2539999999999995e-06, + "loss": 0.1858, + "step": 3630 + }, + { + "epoch": 0.36, + "learning_rate": 7.264e-06, + "loss": 0.2207, + "step": 3635 + }, + { + "epoch": 0.36, + "learning_rate": 7.274e-06, + "loss": 0.1972, + "step": 3640 + }, + { + "epoch": 0.36, + "learning_rate": 7.284e-06, + "loss": 0.1932, + "step": 3645 + }, + { + "epoch": 0.36, + "learning_rate": 7.294000000000001e-06, + "loss": 0.1993, + "step": 3650 + }, + { + "epoch": 0.36, + "learning_rate": 7.304e-06, + "loss": 0.2153, + "step": 3655 + }, + { + "epoch": 0.36, + "learning_rate": 7.314e-06, + "loss": 0.2095, + "step": 3660 + }, + { + "epoch": 0.36, + "learning_rate": 7.3240000000000005e-06, + "loss": 0.192, + "step": 3665 + }, + { + "epoch": 0.36, + "learning_rate": 7.3340000000000004e-06, + "loss": 0.2034, + "step": 3670 + }, + { + "epoch": 0.36, + "learning_rate": 7.3439999999999995e-06, + "loss": 0.221, + "step": 3675 + }, + { + "epoch": 0.36, + "learning_rate": 7.354e-06, + "loss": 0.2065, + "step": 3680 + }, + { + "epoch": 0.36, + "learning_rate": 7.364e-06, + "loss": 0.2134, + "step": 3685 + }, + { + "epoch": 0.36, + "learning_rate": 7.374e-06, + "loss": 0.1978, + "step": 3690 + }, + { + "epoch": 0.36, + "learning_rate": 7.384000000000001e-06, + "loss": 0.1875, + "step": 3695 + }, + { + "epoch": 0.36, + "learning_rate": 7.394e-06, + "loss": 0.2078, + "step": 3700 + }, + { + "epoch": 0.36, + "learning_rate": 7.404e-06, + "loss": 0.2014, + "step": 3705 + }, + { + "epoch": 0.36, + "learning_rate": 7.4140000000000005e-06, + "loss": 0.1997, + "step": 3710 + }, + { + "epoch": 0.36, + "learning_rate": 7.424e-06, + "loss": 0.1951, + "step": 3715 + }, + { + "epoch": 0.36, + "learning_rate": 7.434e-06, + "loss": 0.2078, + "step": 3720 + }, + { + "epoch": 0.36, + "learning_rate": 7.444e-06, + "loss": 0.1835, + "step": 3725 + }, + { + "epoch": 0.36, + "learning_rate": 7.454e-06, + "loss": 0.1789, + "step": 3730 + }, + { + "epoch": 0.37, + "learning_rate": 7.464e-06, + "loss": 0.22, + "step": 3735 + }, + { + "epoch": 0.37, + "learning_rate": 7.474000000000001e-06, + "loss": 0.2021, + "step": 3740 + }, + { + "epoch": 0.37, + "learning_rate": 7.484000000000001e-06, + "loss": 0.1759, + "step": 3745 + }, + { + "epoch": 0.37, + "learning_rate": 7.494e-06, + "loss": 0.203, + "step": 3750 + }, + { + "epoch": 0.37, + "learning_rate": 7.504e-06, + "loss": 0.1975, + "step": 3755 + }, + { + "epoch": 0.37, + "learning_rate": 7.514e-06, + "loss": 0.1737, + "step": 3760 + }, + { + "epoch": 0.37, + "learning_rate": 7.524000000000001e-06, + "loss": 0.192, + "step": 3765 + }, + { + "epoch": 0.37, + "learning_rate": 7.533999999999999e-06, + "loss": 0.2262, + "step": 3770 + }, + { + "epoch": 0.37, + "learning_rate": 7.544e-06, + "loss": 0.1745, + "step": 3775 + }, + { + "epoch": 0.37, + "learning_rate": 7.554000000000001e-06, + "loss": 0.1918, + "step": 3780 + }, + { + "epoch": 0.37, + "learning_rate": 7.564e-06, + "loss": 0.2226, + "step": 3785 + }, + { + "epoch": 0.37, + "learning_rate": 7.574000000000001e-06, + "loss": 0.2084, + "step": 3790 + }, + { + "epoch": 0.37, + "learning_rate": 7.5840000000000006e-06, + "loss": 0.1733, + "step": 3795 + }, + { + "epoch": 0.37, + "learning_rate": 7.594e-06, + "loss": 0.2094, + "step": 3800 + }, + { + "epoch": 0.37, + "learning_rate": 7.604e-06, + "loss": 0.2077, + "step": 3805 + }, + { + "epoch": 0.37, + "learning_rate": 7.614000000000001e-06, + "loss": 0.1862, + "step": 3810 + }, + { + "epoch": 0.37, + "learning_rate": 7.624e-06, + "loss": 0.2156, + "step": 3815 + }, + { + "epoch": 0.37, + "learning_rate": 7.634e-06, + "loss": 0.2128, + "step": 3820 + }, + { + "epoch": 0.37, + "learning_rate": 7.644000000000002e-06, + "loss": 0.1962, + "step": 3825 + }, + { + "epoch": 0.37, + "learning_rate": 7.654e-06, + "loss": 0.1889, + "step": 3830 + }, + { + "epoch": 0.38, + "learning_rate": 7.664e-06, + "loss": 0.1897, + "step": 3835 + }, + { + "epoch": 0.38, + "learning_rate": 7.674000000000001e-06, + "loss": 0.2081, + "step": 3840 + }, + { + "epoch": 0.38, + "learning_rate": 7.684e-06, + "loss": 0.1927, + "step": 3845 + }, + { + "epoch": 0.38, + "learning_rate": 7.694000000000001e-06, + "loss": 0.2289, + "step": 3850 + }, + { + "epoch": 0.38, + "learning_rate": 7.704e-06, + "loss": 0.2089, + "step": 3855 + }, + { + "epoch": 0.38, + "learning_rate": 7.714e-06, + "loss": 0.2127, + "step": 3860 + }, + { + "epoch": 0.38, + "learning_rate": 7.724000000000001e-06, + "loss": 0.1924, + "step": 3865 + }, + { + "epoch": 0.38, + "learning_rate": 7.733999999999999e-06, + "loss": 0.2001, + "step": 3870 + }, + { + "epoch": 0.38, + "learning_rate": 7.744e-06, + "loss": 0.1782, + "step": 3875 + }, + { + "epoch": 0.38, + "learning_rate": 7.754e-06, + "loss": 0.1802, + "step": 3880 + }, + { + "epoch": 0.38, + "learning_rate": 7.763999999999999e-06, + "loss": 0.235, + "step": 3885 + }, + { + "epoch": 0.38, + "learning_rate": 7.774e-06, + "loss": 0.1886, + "step": 3890 + }, + { + "epoch": 0.38, + "learning_rate": 7.784e-06, + "loss": 0.1938, + "step": 3895 + }, + { + "epoch": 0.38, + "learning_rate": 7.794e-06, + "loss": 0.2316, + "step": 3900 + }, + { + "epoch": 0.38, + "learning_rate": 7.804e-06, + "loss": 0.2257, + "step": 3905 + }, + { + "epoch": 0.38, + "learning_rate": 7.814e-06, + "loss": 0.1956, + "step": 3910 + }, + { + "epoch": 0.38, + "learning_rate": 7.824e-06, + "loss": 0.2215, + "step": 3915 + }, + { + "epoch": 0.38, + "learning_rate": 7.834e-06, + "loss": 0.2492, + "step": 3920 + }, + { + "epoch": 0.38, + "learning_rate": 7.844e-06, + "loss": 0.192, + "step": 3925 + }, + { + "epoch": 0.38, + "learning_rate": 7.854e-06, + "loss": 0.2092, + "step": 3930 + }, + { + "epoch": 0.38, + "learning_rate": 7.864e-06, + "loss": 0.2362, + "step": 3935 + }, + { + "epoch": 0.39, + "learning_rate": 7.874000000000001e-06, + "loss": 0.1876, + "step": 3940 + }, + { + "epoch": 0.39, + "learning_rate": 7.884e-06, + "loss": 0.2013, + "step": 3945 + }, + { + "epoch": 0.39, + "learning_rate": 7.894e-06, + "loss": 0.1858, + "step": 3950 + }, + { + "epoch": 0.39, + "learning_rate": 7.904000000000001e-06, + "loss": 0.1906, + "step": 3955 + }, + { + "epoch": 0.39, + "learning_rate": 7.913999999999999e-06, + "loss": 0.1853, + "step": 3960 + }, + { + "epoch": 0.39, + "learning_rate": 7.924e-06, + "loss": 0.2159, + "step": 3965 + }, + { + "epoch": 0.39, + "learning_rate": 7.934e-06, + "loss": 0.2649, + "step": 3970 + }, + { + "epoch": 0.39, + "learning_rate": 7.943999999999999e-06, + "loss": 0.1959, + "step": 3975 + }, + { + "epoch": 0.39, + "learning_rate": 7.954e-06, + "loss": 0.2014, + "step": 3980 + }, + { + "epoch": 0.39, + "learning_rate": 7.964e-06, + "loss": 0.2396, + "step": 3985 + }, + { + "epoch": 0.39, + "learning_rate": 7.974e-06, + "loss": 0.199, + "step": 3990 + }, + { + "epoch": 0.39, + "learning_rate": 7.984e-06, + "loss": 0.1781, + "step": 3995 + }, + { + "epoch": 0.39, + "learning_rate": 7.994e-06, + "loss": 0.1989, + "step": 4000 + }, + { + "epoch": 0.39, + "eval_cer": 0.07107991056047688, + "eval_loss": 0.33616000413894653, + "eval_runtime": 272.3121, + "eval_samples_per_second": 60.115, + "eval_steps_per_second": 1.671, + "eval_wer": 0.19002500930502864, + "step": 4000 + }, + { + "epoch": 0.39, + "learning_rate": 8.004e-06, + "loss": 0.198, + "step": 4005 + }, + { + "epoch": 0.39, + "learning_rate": 8.014e-06, + "loss": 0.1929, + "step": 4010 + }, + { + "epoch": 0.39, + "learning_rate": 8.024000000000001e-06, + "loss": 0.1795, + "step": 4015 + }, + { + "epoch": 0.39, + "learning_rate": 8.034e-06, + "loss": 0.2159, + "step": 4020 + }, + { + "epoch": 0.39, + "learning_rate": 8.044e-06, + "loss": 0.2016, + "step": 4025 + }, + { + "epoch": 0.39, + "learning_rate": 8.054000000000001e-06, + "loss": 0.2112, + "step": 4030 + }, + { + "epoch": 0.39, + "learning_rate": 8.064e-06, + "loss": 0.2482, + "step": 4035 + }, + { + "epoch": 0.4, + "learning_rate": 8.074000000000001e-06, + "loss": 0.1842, + "step": 4040 + }, + { + "epoch": 0.4, + "learning_rate": 8.084000000000001e-06, + "loss": 0.1773, + "step": 4045 + }, + { + "epoch": 0.4, + "learning_rate": 8.093999999999999e-06, + "loss": 0.2132, + "step": 4050 + }, + { + "epoch": 0.4, + "learning_rate": 8.104e-06, + "loss": 0.1887, + "step": 4055 + }, + { + "epoch": 0.4, + "learning_rate": 8.114e-06, + "loss": 0.1902, + "step": 4060 + }, + { + "epoch": 0.4, + "learning_rate": 8.124e-06, + "loss": 0.2071, + "step": 4065 + }, + { + "epoch": 0.4, + "learning_rate": 8.134e-06, + "loss": 0.2301, + "step": 4070 + }, + { + "epoch": 0.4, + "learning_rate": 8.144e-06, + "loss": 0.1762, + "step": 4075 + }, + { + "epoch": 0.4, + "learning_rate": 8.154e-06, + "loss": 0.2064, + "step": 4080 + }, + { + "epoch": 0.4, + "learning_rate": 8.164e-06, + "loss": 0.2285, + "step": 4085 + }, + { + "epoch": 0.4, + "learning_rate": 8.174000000000002e-06, + "loss": 0.2104, + "step": 4090 + }, + { + "epoch": 0.4, + "learning_rate": 8.184e-06, + "loss": 0.1958, + "step": 4095 + }, + { + "epoch": 0.4, + "learning_rate": 8.194e-06, + "loss": 0.1969, + "step": 4100 + }, + { + "epoch": 0.4, + "learning_rate": 8.204000000000001e-06, + "loss": 0.2019, + "step": 4105 + }, + { + "epoch": 0.4, + "learning_rate": 8.214e-06, + "loss": 0.1847, + "step": 4110 + }, + { + "epoch": 0.4, + "learning_rate": 8.224000000000001e-06, + "loss": 0.2113, + "step": 4115 + }, + { + "epoch": 0.4, + "learning_rate": 8.234000000000001e-06, + "loss": 0.2279, + "step": 4120 + }, + { + "epoch": 0.4, + "learning_rate": 8.244e-06, + "loss": 0.1676, + "step": 4125 + }, + { + "epoch": 0.4, + "learning_rate": 8.254000000000001e-06, + "loss": 0.1924, + "step": 4130 + }, + { + "epoch": 0.4, + "learning_rate": 8.264e-06, + "loss": 0.2313, + "step": 4135 + }, + { + "epoch": 0.4, + "learning_rate": 8.274e-06, + "loss": 0.1841, + "step": 4140 + }, + { + "epoch": 0.41, + "learning_rate": 8.284e-06, + "loss": 0.178, + "step": 4145 + }, + { + "epoch": 0.41, + "learning_rate": 8.294e-06, + "loss": 0.2067, + "step": 4150 + }, + { + "epoch": 0.41, + "learning_rate": 8.304e-06, + "loss": 0.2009, + "step": 4155 + }, + { + "epoch": 0.41, + "learning_rate": 8.314e-06, + "loss": 0.1725, + "step": 4160 + }, + { + "epoch": 0.41, + "learning_rate": 8.323999999999999e-06, + "loss": 0.1748, + "step": 4165 + }, + { + "epoch": 0.41, + "learning_rate": 8.334e-06, + "loss": 0.2301, + "step": 4170 + }, + { + "epoch": 0.41, + "learning_rate": 8.344e-06, + "loss": 0.2003, + "step": 4175 + }, + { + "epoch": 0.41, + "learning_rate": 8.354e-06, + "loss": 0.1772, + "step": 4180 + }, + { + "epoch": 0.41, + "learning_rate": 8.364e-06, + "loss": 0.2587, + "step": 4185 + }, + { + "epoch": 0.41, + "learning_rate": 8.374e-06, + "loss": 0.1979, + "step": 4190 + }, + { + "epoch": 0.41, + "learning_rate": 8.384e-06, + "loss": 0.1856, + "step": 4195 + }, + { + "epoch": 0.41, + "learning_rate": 8.394e-06, + "loss": 0.2042, + "step": 4200 + }, + { + "epoch": 0.41, + "learning_rate": 8.404000000000001e-06, + "loss": 0.2075, + "step": 4205 + }, + { + "epoch": 0.41, + "learning_rate": 8.414e-06, + "loss": 0.1753, + "step": 4210 + }, + { + "epoch": 0.41, + "learning_rate": 8.424e-06, + "loss": 0.1915, + "step": 4215 + }, + { + "epoch": 0.41, + "learning_rate": 8.434000000000001e-06, + "loss": 0.2201, + "step": 4220 + }, + { + "epoch": 0.41, + "learning_rate": 8.443999999999999e-06, + "loss": 0.184, + "step": 4225 + }, + { + "epoch": 0.41, + "learning_rate": 8.454e-06, + "loss": 0.2022, + "step": 4230 + }, + { + "epoch": 0.41, + "learning_rate": 8.464e-06, + "loss": 0.2193, + "step": 4235 + }, + { + "epoch": 0.41, + "learning_rate": 8.473999999999999e-06, + "loss": 0.1943, + "step": 4240 + }, + { + "epoch": 0.42, + "learning_rate": 8.484e-06, + "loss": 0.1723, + "step": 4245 + }, + { + "epoch": 0.42, + "learning_rate": 8.494e-06, + "loss": 0.2041, + "step": 4250 + }, + { + "epoch": 0.42, + "learning_rate": 8.504e-06, + "loss": 0.2075, + "step": 4255 + }, + { + "epoch": 0.42, + "learning_rate": 8.514e-06, + "loss": 0.1924, + "step": 4260 + }, + { + "epoch": 0.42, + "learning_rate": 8.524e-06, + "loss": 0.2013, + "step": 4265 + }, + { + "epoch": 0.42, + "learning_rate": 8.534e-06, + "loss": 0.213, + "step": 4270 + }, + { + "epoch": 0.42, + "learning_rate": 8.544e-06, + "loss": 0.1812, + "step": 4275 + }, + { + "epoch": 0.42, + "learning_rate": 8.554000000000001e-06, + "loss": 0.1887, + "step": 4280 + }, + { + "epoch": 0.42, + "learning_rate": 8.564e-06, + "loss": 0.2153, + "step": 4285 + }, + { + "epoch": 0.42, + "learning_rate": 8.574e-06, + "loss": 0.2027, + "step": 4290 + }, + { + "epoch": 0.42, + "learning_rate": 8.584000000000001e-06, + "loss": 0.1776, + "step": 4295 + }, + { + "epoch": 0.42, + "learning_rate": 8.594e-06, + "loss": 0.2192, + "step": 4300 + }, + { + "epoch": 0.42, + "learning_rate": 8.604000000000001e-06, + "loss": 0.2251, + "step": 4305 + }, + { + "epoch": 0.42, + "learning_rate": 8.614000000000001e-06, + "loss": 0.1833, + "step": 4310 + }, + { + "epoch": 0.42, + "learning_rate": 8.623999999999999e-06, + "loss": 0.1901, + "step": 4315 + }, + { + "epoch": 0.42, + "learning_rate": 8.634e-06, + "loss": 0.2287, + "step": 4320 + }, + { + "epoch": 0.42, + "learning_rate": 8.644e-06, + "loss": 0.1853, + "step": 4325 + }, + { + "epoch": 0.42, + "learning_rate": 8.654e-06, + "loss": 0.1682, + "step": 4330 + }, + { + "epoch": 0.42, + "learning_rate": 8.664e-06, + "loss": 0.1988, + "step": 4335 + }, + { + "epoch": 0.42, + "learning_rate": 8.674e-06, + "loss": 0.1864, + "step": 4340 + }, + { + "epoch": 0.42, + "learning_rate": 8.684e-06, + "loss": 0.1853, + "step": 4345 + }, + { + "epoch": 0.43, + "learning_rate": 8.694e-06, + "loss": 0.1915, + "step": 4350 + }, + { + "epoch": 0.43, + "learning_rate": 8.704e-06, + "loss": 0.1978, + "step": 4355 + }, + { + "epoch": 0.43, + "learning_rate": 8.714e-06, + "loss": 0.1659, + "step": 4360 + }, + { + "epoch": 0.43, + "learning_rate": 8.724e-06, + "loss": 0.1935, + "step": 4365 + }, + { + "epoch": 0.43, + "learning_rate": 8.734000000000001e-06, + "loss": 0.2188, + "step": 4370 + }, + { + "epoch": 0.43, + "learning_rate": 8.744e-06, + "loss": 0.1894, + "step": 4375 + }, + { + "epoch": 0.43, + "learning_rate": 8.754e-06, + "loss": 0.1993, + "step": 4380 + }, + { + "epoch": 0.43, + "learning_rate": 8.764000000000001e-06, + "loss": 0.2316, + "step": 4385 + }, + { + "epoch": 0.43, + "learning_rate": 8.774e-06, + "loss": 0.2069, + "step": 4390 + }, + { + "epoch": 0.43, + "learning_rate": 8.784000000000001e-06, + "loss": 0.1734, + "step": 4395 + }, + { + "epoch": 0.43, + "learning_rate": 8.794e-06, + "loss": 0.1879, + "step": 4400 + }, + { + "epoch": 0.43, + "learning_rate": 8.803999999999999e-06, + "loss": 0.2003, + "step": 4405 + }, + { + "epoch": 0.43, + "learning_rate": 8.814e-06, + "loss": 0.1885, + "step": 4410 + }, + { + "epoch": 0.43, + "learning_rate": 8.824e-06, + "loss": 0.1875, + "step": 4415 + }, + { + "epoch": 0.43, + "learning_rate": 8.834e-06, + "loss": 0.2111, + "step": 4420 + }, + { + "epoch": 0.43, + "learning_rate": 8.844e-06, + "loss": 0.1927, + "step": 4425 + }, + { + "epoch": 0.43, + "learning_rate": 8.854e-06, + "loss": 0.1799, + "step": 4430 + }, + { + "epoch": 0.43, + "learning_rate": 8.864e-06, + "loss": 0.2081, + "step": 4435 + }, + { + "epoch": 0.43, + "learning_rate": 8.874e-06, + "loss": 0.1931, + "step": 4440 + }, + { + "epoch": 0.43, + "learning_rate": 8.884000000000002e-06, + "loss": 0.1675, + "step": 4445 + }, + { + "epoch": 0.44, + "learning_rate": 8.894e-06, + "loss": 0.2231, + "step": 4450 + }, + { + "epoch": 0.44, + "learning_rate": 8.904e-06, + "loss": 0.2107, + "step": 4455 + }, + { + "epoch": 0.44, + "learning_rate": 8.914000000000001e-06, + "loss": 0.1799, + "step": 4460 + }, + { + "epoch": 0.44, + "learning_rate": 8.924e-06, + "loss": 0.1843, + "step": 4465 + }, + { + "epoch": 0.44, + "learning_rate": 8.934000000000001e-06, + "loss": 0.2212, + "step": 4470 + }, + { + "epoch": 0.44, + "learning_rate": 8.944e-06, + "loss": 0.1852, + "step": 4475 + }, + { + "epoch": 0.44, + "learning_rate": 8.952e-06, + "loss": 0.1893, + "step": 4480 + }, + { + "epoch": 0.44, + "learning_rate": 8.962e-06, + "loss": 0.234, + "step": 4485 + }, + { + "epoch": 0.44, + "learning_rate": 8.972e-06, + "loss": 0.1893, + "step": 4490 + }, + { + "epoch": 0.44, + "learning_rate": 8.982e-06, + "loss": 0.1634, + "step": 4495 + }, + { + "epoch": 0.44, + "learning_rate": 8.992000000000001e-06, + "loss": 0.2036, + "step": 4500 + }, + { + "epoch": 0.44, + "eval_cer": 0.06956767043339322, + "eval_loss": 0.32818591594696045, + "eval_runtime": 275.6631, + "eval_samples_per_second": 59.384, + "eval_steps_per_second": 1.651, + "eval_wer": 0.18708657921028057, + "step": 4500 + }, + { + "epoch": 0.44, + "learning_rate": 9.002e-06, + "loss": 0.2157, + "step": 4505 + }, + { + "epoch": 0.44, + "learning_rate": 9.012e-06, + "loss": 0.1947, + "step": 4510 + }, + { + "epoch": 0.44, + "learning_rate": 9.022000000000001e-06, + "loss": 0.1906, + "step": 4515 + }, + { + "epoch": 0.44, + "learning_rate": 9.032e-06, + "loss": 0.2326, + "step": 4520 + }, + { + "epoch": 0.44, + "learning_rate": 9.042e-06, + "loss": 0.1757, + "step": 4525 + }, + { + "epoch": 0.44, + "learning_rate": 9.052e-06, + "loss": 0.1981, + "step": 4530 + }, + { + "epoch": 0.44, + "learning_rate": 9.061999999999999e-06, + "loss": 0.2389, + "step": 4535 + }, + { + "epoch": 0.44, + "learning_rate": 9.072e-06, + "loss": 0.1908, + "step": 4540 + }, + { + "epoch": 0.44, + "learning_rate": 9.082e-06, + "loss": 0.1705, + "step": 4545 + }, + { + "epoch": 0.44, + "learning_rate": 9.092e-06, + "loss": 0.195, + "step": 4550 + }, + { + "epoch": 0.45, + "learning_rate": 9.102e-06, + "loss": 0.2036, + "step": 4555 + }, + { + "epoch": 0.45, + "learning_rate": 9.112e-06, + "loss": 0.1583, + "step": 4560 + }, + { + "epoch": 0.45, + "learning_rate": 9.122e-06, + "loss": 0.1864, + "step": 4565 + }, + { + "epoch": 0.45, + "learning_rate": 9.132e-06, + "loss": 0.2181, + "step": 4570 + }, + { + "epoch": 0.45, + "learning_rate": 9.142000000000002e-06, + "loss": 0.158, + "step": 4575 + }, + { + "epoch": 0.45, + "learning_rate": 9.152e-06, + "loss": 0.1711, + "step": 4580 + }, + { + "epoch": 0.45, + "learning_rate": 9.162e-06, + "loss": 0.1979, + "step": 4585 + }, + { + "epoch": 0.45, + "learning_rate": 9.172000000000001e-06, + "loss": 0.2152, + "step": 4590 + }, + { + "epoch": 0.45, + "learning_rate": 9.182e-06, + "loss": 0.1739, + "step": 4595 + }, + { + "epoch": 0.45, + "learning_rate": 9.192000000000001e-06, + "loss": 0.2144, + "step": 4600 + }, + { + "epoch": 0.45, + "learning_rate": 9.202000000000001e-06, + "loss": 0.2015, + "step": 4605 + }, + { + "epoch": 0.45, + "learning_rate": 9.212e-06, + "loss": 0.1793, + "step": 4610 + }, + { + "epoch": 0.45, + "learning_rate": 9.222e-06, + "loss": 0.1782, + "step": 4615 + }, + { + "epoch": 0.45, + "learning_rate": 9.232e-06, + "loss": 0.2277, + "step": 4620 + }, + { + "epoch": 0.45, + "learning_rate": 9.242e-06, + "loss": 0.1879, + "step": 4625 + }, + { + "epoch": 0.45, + "learning_rate": 9.252e-06, + "loss": 0.1679, + "step": 4630 + }, + { + "epoch": 0.45, + "learning_rate": 9.262e-06, + "loss": 0.2196, + "step": 4635 + }, + { + "epoch": 0.45, + "learning_rate": 9.272e-06, + "loss": 0.1912, + "step": 4640 + }, + { + "epoch": 0.45, + "learning_rate": 9.282e-06, + "loss": 0.1674, + "step": 4645 + }, + { + "epoch": 0.45, + "learning_rate": 9.292000000000002e-06, + "loss": 0.2357, + "step": 4650 + }, + { + "epoch": 0.46, + "learning_rate": 9.302e-06, + "loss": 0.2135, + "step": 4655 + }, + { + "epoch": 0.46, + "learning_rate": 9.312e-06, + "loss": 0.1615, + "step": 4660 + }, + { + "epoch": 0.46, + "learning_rate": 9.322e-06, + "loss": 0.1919, + "step": 4665 + }, + { + "epoch": 0.46, + "learning_rate": 9.332e-06, + "loss": 0.2248, + "step": 4670 + }, + { + "epoch": 0.46, + "learning_rate": 9.342000000000001e-06, + "loss": 0.1849, + "step": 4675 + }, + { + "epoch": 0.46, + "learning_rate": 9.352e-06, + "loss": 0.181, + "step": 4680 + }, + { + "epoch": 0.46, + "learning_rate": 9.362e-06, + "loss": 0.2197, + "step": 4685 + }, + { + "epoch": 0.46, + "learning_rate": 9.372000000000001e-06, + "loss": 0.1913, + "step": 4690 + }, + { + "epoch": 0.46, + "learning_rate": 9.382e-06, + "loss": 0.1591, + "step": 4695 + }, + { + "epoch": 0.46, + "learning_rate": 9.392e-06, + "loss": 0.2286, + "step": 4700 + }, + { + "epoch": 0.46, + "learning_rate": 9.402e-06, + "loss": 0.1792, + "step": 4705 + }, + { + "epoch": 0.46, + "learning_rate": 9.411999999999999e-06, + "loss": 0.1794, + "step": 4710 + }, + { + "epoch": 0.46, + "learning_rate": 9.422e-06, + "loss": 0.1761, + "step": 4715 + }, + { + "epoch": 0.46, + "learning_rate": 9.432e-06, + "loss": 0.2265, + "step": 4720 + }, + { + "epoch": 0.46, + "learning_rate": 9.441999999999999e-06, + "loss": 0.1774, + "step": 4725 + }, + { + "epoch": 0.46, + "learning_rate": 9.452e-06, + "loss": 0.1866, + "step": 4730 + }, + { + "epoch": 0.46, + "learning_rate": 9.462e-06, + "loss": 0.2411, + "step": 4735 + }, + { + "epoch": 0.46, + "learning_rate": 9.472e-06, + "loss": 0.1927, + "step": 4740 + }, + { + "epoch": 0.46, + "learning_rate": 9.482e-06, + "loss": 0.1749, + "step": 4745 + }, + { + "epoch": 0.46, + "learning_rate": 9.492e-06, + "loss": 0.1981, + "step": 4750 + }, + { + "epoch": 0.46, + "learning_rate": 9.502e-06, + "loss": 0.1806, + "step": 4755 + }, + { + "epoch": 0.47, + "learning_rate": 9.512e-06, + "loss": 0.167, + "step": 4760 + }, + { + "epoch": 0.47, + "learning_rate": 9.522000000000001e-06, + "loss": 0.2192, + "step": 4765 + }, + { + "epoch": 0.47, + "learning_rate": 9.532e-06, + "loss": 0.205, + "step": 4770 + }, + { + "epoch": 0.47, + "learning_rate": 9.542e-06, + "loss": 0.1795, + "step": 4775 + }, + { + "epoch": 0.47, + "learning_rate": 9.552000000000001e-06, + "loss": 0.1957, + "step": 4780 + }, + { + "epoch": 0.47, + "learning_rate": 9.562e-06, + "loss": 0.2066, + "step": 4785 + }, + { + "epoch": 0.47, + "learning_rate": 9.572000000000001e-06, + "loss": 0.1724, + "step": 4790 + }, + { + "epoch": 0.47, + "learning_rate": 9.582e-06, + "loss": 0.1683, + "step": 4795 + }, + { + "epoch": 0.47, + "learning_rate": 9.591999999999999e-06, + "loss": 0.206, + "step": 4800 + }, + { + "epoch": 0.47, + "learning_rate": 9.602e-06, + "loss": 0.2105, + "step": 4805 + }, + { + "epoch": 0.47, + "learning_rate": 9.612e-06, + "loss": 0.1735, + "step": 4810 + }, + { + "epoch": 0.47, + "learning_rate": 9.622e-06, + "loss": 0.1892, + "step": 4815 + }, + { + "epoch": 0.47, + "learning_rate": 9.632e-06, + "loss": 0.2141, + "step": 4820 + }, + { + "epoch": 0.47, + "learning_rate": 9.642e-06, + "loss": 0.1871, + "step": 4825 + }, + { + "epoch": 0.47, + "learning_rate": 9.652e-06, + "loss": 0.1618, + "step": 4830 + }, + { + "epoch": 0.47, + "learning_rate": 9.662e-06, + "loss": 0.2233, + "step": 4835 + }, + { + "epoch": 0.47, + "learning_rate": 9.672000000000002e-06, + "loss": 0.1725, + "step": 4840 + }, + { + "epoch": 0.47, + "learning_rate": 9.682e-06, + "loss": 0.1585, + "step": 4845 + }, + { + "epoch": 0.47, + "learning_rate": 9.692e-06, + "loss": 0.1953, + "step": 4850 + }, + { + "epoch": 0.47, + "learning_rate": 9.702000000000001e-06, + "loss": 0.2101, + "step": 4855 + }, + { + "epoch": 0.48, + "learning_rate": 9.712e-06, + "loss": 0.1731, + "step": 4860 + }, + { + "epoch": 0.48, + "learning_rate": 9.722000000000001e-06, + "loss": 0.1442, + "step": 4865 + }, + { + "epoch": 0.48, + "learning_rate": 9.732000000000001e-06, + "loss": 0.2237, + "step": 4870 + }, + { + "epoch": 0.48, + "learning_rate": 9.742e-06, + "loss": 0.1739, + "step": 4875 + }, + { + "epoch": 0.48, + "learning_rate": 9.752e-06, + "loss": 0.1959, + "step": 4880 + }, + { + "epoch": 0.48, + "learning_rate": 9.762e-06, + "loss": 0.224, + "step": 4885 + }, + { + "epoch": 0.48, + "learning_rate": 9.772e-06, + "loss": 0.1726, + "step": 4890 + }, + { + "epoch": 0.48, + "learning_rate": 9.782e-06, + "loss": 0.1716, + "step": 4895 + }, + { + "epoch": 0.48, + "learning_rate": 9.792e-06, + "loss": 0.1843, + "step": 4900 + }, + { + "epoch": 0.48, + "learning_rate": 9.802e-06, + "loss": 0.1951, + "step": 4905 + }, + { + "epoch": 0.48, + "learning_rate": 9.812e-06, + "loss": 0.1698, + "step": 4910 + }, + { + "epoch": 0.48, + "learning_rate": 9.822e-06, + "loss": 0.1819, + "step": 4915 + }, + { + "epoch": 0.48, + "learning_rate": 9.832e-06, + "loss": 0.2245, + "step": 4920 + }, + { + "epoch": 0.48, + "learning_rate": 9.842e-06, + "loss": 0.1806, + "step": 4925 + }, + { + "epoch": 0.48, + "learning_rate": 9.852000000000002e-06, + "loss": 0.1987, + "step": 4930 + }, + { + "epoch": 0.48, + "learning_rate": 9.862e-06, + "loss": 0.2065, + "step": 4935 + }, + { + "epoch": 0.48, + "learning_rate": 9.872e-06, + "loss": 0.1851, + "step": 4940 + }, + { + "epoch": 0.48, + "learning_rate": 9.882000000000001e-06, + "loss": 0.1822, + "step": 4945 + }, + { + "epoch": 0.48, + "learning_rate": 9.892e-06, + "loss": 0.1915, + "step": 4950 + }, + { + "epoch": 0.48, + "learning_rate": 9.902000000000001e-06, + "loss": 0.2016, + "step": 4955 + }, + { + "epoch": 0.49, + "learning_rate": 9.912000000000001e-06, + "loss": 0.1772, + "step": 4960 + }, + { + "epoch": 0.49, + "learning_rate": 9.922e-06, + "loss": 0.2081, + "step": 4965 + }, + { + "epoch": 0.49, + "learning_rate": 9.932e-06, + "loss": 0.1953, + "step": 4970 + }, + { + "epoch": 0.49, + "learning_rate": 9.941999999999999e-06, + "loss": 0.1875, + "step": 4975 + }, + { + "epoch": 0.49, + "learning_rate": 9.952e-06, + "loss": 0.1625, + "step": 4980 + }, + { + "epoch": 0.49, + "learning_rate": 9.962e-06, + "loss": 0.1871, + "step": 4985 + }, + { + "epoch": 0.49, + "learning_rate": 9.971999999999999e-06, + "loss": 0.1921, + "step": 4990 + }, + { + "epoch": 0.49, + "learning_rate": 9.982e-06, + "loss": 0.1725, + "step": 4995 + }, + { + "epoch": 0.49, + "learning_rate": 9.992e-06, + "loss": 0.198, + "step": 5000 + }, + { + "epoch": 0.49, + "eval_cer": 0.06768315100896939, + "eval_loss": 0.315591424703598, + "eval_runtime": 272.8439, + "eval_samples_per_second": 59.998, + "eval_steps_per_second": 1.668, + "eval_wer": 0.18033471983701507, + "step": 5000 + }, + { + "epoch": 0.49, + "learning_rate": 1.0002e-05, + "loss": 0.2029, + "step": 5005 + }, + { + "epoch": 0.49, + "learning_rate": 1.0012e-05, + "loss": 0.1609, + "step": 5010 + }, + { + "epoch": 0.49, + "learning_rate": 1.0022e-05, + "loss": 0.1991, + "step": 5015 + }, + { + "epoch": 0.49, + "learning_rate": 1.0032e-05, + "loss": 0.2175, + "step": 5020 + }, + { + "epoch": 0.49, + "learning_rate": 1.0042e-05, + "loss": 0.1745, + "step": 5025 + }, + { + "epoch": 0.49, + "learning_rate": 1.0052000000000001e-05, + "loss": 0.1825, + "step": 5030 + }, + { + "epoch": 0.49, + "learning_rate": 1.0062e-05, + "loss": 0.218, + "step": 5035 + }, + { + "epoch": 0.49, + "learning_rate": 1.0072e-05, + "loss": 0.1753, + "step": 5040 + }, + { + "epoch": 0.49, + "learning_rate": 1.0082000000000001e-05, + "loss": 0.1696, + "step": 5045 + }, + { + "epoch": 0.49, + "learning_rate": 1.0092e-05, + "loss": 0.1894, + "step": 5050 + }, + { + "epoch": 0.49, + "learning_rate": 1.0102000000000001e-05, + "loss": 0.1717, + "step": 5055 + }, + { + "epoch": 0.49, + "learning_rate": 1.0112e-05, + "loss": 0.1714, + "step": 5060 + }, + { + "epoch": 0.5, + "learning_rate": 1.0121999999999999e-05, + "loss": 0.1728, + "step": 5065 + }, + { + "epoch": 0.5, + "learning_rate": 1.0132e-05, + "loss": 0.1993, + "step": 5070 + }, + { + "epoch": 0.5, + "learning_rate": 1.0142e-05, + "loss": 0.1788, + "step": 5075 + }, + { + "epoch": 0.5, + "learning_rate": 1.0152e-05, + "loss": 0.1757, + "step": 5080 + }, + { + "epoch": 0.5, + "learning_rate": 1.0162e-05, + "loss": 0.2619, + "step": 5085 + }, + { + "epoch": 0.5, + "learning_rate": 1.0172e-05, + "loss": 0.1835, + "step": 5090 + }, + { + "epoch": 0.5, + "learning_rate": 1.0182e-05, + "loss": 0.1712, + "step": 5095 + }, + { + "epoch": 0.5, + "learning_rate": 1.0192e-05, + "loss": 0.1985, + "step": 5100 + }, + { + "epoch": 0.5, + "learning_rate": 1.0202000000000002e-05, + "loss": 0.2048, + "step": 5105 + }, + { + "epoch": 0.5, + "learning_rate": 1.0212e-05, + "loss": 0.161, + "step": 5110 + }, + { + "epoch": 0.5, + "learning_rate": 1.0222e-05, + "loss": 0.1841, + "step": 5115 + }, + { + "epoch": 0.5, + "learning_rate": 1.0232000000000001e-05, + "loss": 0.2024, + "step": 5120 + }, + { + "epoch": 0.5, + "learning_rate": 1.0242e-05, + "loss": 0.172, + "step": 5125 + }, + { + "epoch": 0.5, + "learning_rate": 1.0252e-05, + "loss": 0.1972, + "step": 5130 + }, + { + "epoch": 0.5, + "learning_rate": 1.0262000000000001e-05, + "loss": 0.2081, + "step": 5135 + }, + { + "epoch": 0.5, + "learning_rate": 1.0272e-05, + "loss": 0.1774, + "step": 5140 + }, + { + "epoch": 0.5, + "learning_rate": 1.0282e-05, + "loss": 0.1807, + "step": 5145 + }, + { + "epoch": 0.5, + "learning_rate": 1.0292e-05, + "loss": 0.2118, + "step": 5150 + }, + { + "epoch": 0.5, + "learning_rate": 1.0301999999999999e-05, + "loss": 0.2046, + "step": 5155 + }, + { + "epoch": 0.5, + "learning_rate": 1.0312e-05, + "loss": 0.1877, + "step": 5160 + }, + { + "epoch": 0.51, + "learning_rate": 1.0322e-05, + "loss": 0.1963, + "step": 5165 + }, + { + "epoch": 0.51, + "learning_rate": 1.0332e-05, + "loss": 0.2255, + "step": 5170 + }, + { + "epoch": 0.51, + "learning_rate": 1.0342e-05, + "loss": 0.1827, + "step": 5175 + }, + { + "epoch": 0.51, + "learning_rate": 1.0352e-05, + "loss": 0.1798, + "step": 5180 + }, + { + "epoch": 0.51, + "learning_rate": 1.0362e-05, + "loss": 0.1927, + "step": 5185 + }, + { + "epoch": 0.51, + "learning_rate": 1.0372e-05, + "loss": 0.1865, + "step": 5190 + }, + { + "epoch": 0.51, + "learning_rate": 1.0382000000000002e-05, + "loss": 0.1608, + "step": 5195 + }, + { + "epoch": 0.51, + "learning_rate": 1.0392e-05, + "loss": 0.1925, + "step": 5200 + }, + { + "epoch": 0.51, + "learning_rate": 1.0402e-05, + "loss": 0.1983, + "step": 5205 + }, + { + "epoch": 0.51, + "learning_rate": 1.0412000000000001e-05, + "loss": 0.1548, + "step": 5210 + }, + { + "epoch": 0.51, + "learning_rate": 1.0422e-05, + "loss": 0.1828, + "step": 5215 + }, + { + "epoch": 0.51, + "learning_rate": 1.0432000000000001e-05, + "loss": 0.206, + "step": 5220 + }, + { + "epoch": 0.51, + "learning_rate": 1.0442000000000001e-05, + "loss": 0.1733, + "step": 5225 + }, + { + "epoch": 0.51, + "learning_rate": 1.0452e-05, + "loss": 0.156, + "step": 5230 + }, + { + "epoch": 0.51, + "learning_rate": 1.0462e-05, + "loss": 0.194, + "step": 5235 + }, + { + "epoch": 0.51, + "learning_rate": 1.0472e-05, + "loss": 0.1895, + "step": 5240 + }, + { + "epoch": 0.51, + "learning_rate": 1.0482e-05, + "loss": 0.1798, + "step": 5245 + }, + { + "epoch": 0.51, + "learning_rate": 1.0492e-05, + "loss": 0.1778, + "step": 5250 + }, + { + "epoch": 0.51, + "learning_rate": 1.0502e-05, + "loss": 0.202, + "step": 5255 + }, + { + "epoch": 0.51, + "learning_rate": 1.0512e-05, + "loss": 0.1764, + "step": 5260 + }, + { + "epoch": 0.51, + "learning_rate": 1.0522e-05, + "loss": 0.2031, + "step": 5265 + }, + { + "epoch": 0.52, + "learning_rate": 1.0532000000000002e-05, + "loss": 0.1995, + "step": 5270 + }, + { + "epoch": 0.52, + "learning_rate": 1.0542e-05, + "loss": 0.174, + "step": 5275 + }, + { + "epoch": 0.52, + "learning_rate": 1.0552e-05, + "loss": 0.1673, + "step": 5280 + }, + { + "epoch": 0.52, + "learning_rate": 1.0562000000000002e-05, + "loss": 0.2129, + "step": 5285 + }, + { + "epoch": 0.52, + "learning_rate": 1.0572e-05, + "loss": 0.1988, + "step": 5290 + }, + { + "epoch": 0.52, + "learning_rate": 1.0582000000000001e-05, + "loss": 0.1627, + "step": 5295 + }, + { + "epoch": 0.52, + "learning_rate": 1.0592e-05, + "loss": 0.1971, + "step": 5300 + }, + { + "epoch": 0.52, + "learning_rate": 1.0602e-05, + "loss": 0.1838, + "step": 5305 + }, + { + "epoch": 0.52, + "learning_rate": 1.0612000000000001e-05, + "loss": 0.1742, + "step": 5310 + }, + { + "epoch": 0.52, + "learning_rate": 1.0622e-05, + "loss": 0.1804, + "step": 5315 + }, + { + "epoch": 0.52, + "learning_rate": 1.0632000000000001e-05, + "loss": 0.2079, + "step": 5320 + }, + { + "epoch": 0.52, + "learning_rate": 1.0642e-05, + "loss": 0.1714, + "step": 5325 + }, + { + "epoch": 0.52, + "learning_rate": 1.0651999999999999e-05, + "loss": 0.1739, + "step": 5330 + }, + { + "epoch": 0.52, + "learning_rate": 1.0662e-05, + "loss": 0.2064, + "step": 5335 + }, + { + "epoch": 0.52, + "learning_rate": 1.0672e-05, + "loss": 0.1664, + "step": 5340 + }, + { + "epoch": 0.52, + "learning_rate": 1.0682e-05, + "loss": 0.1627, + "step": 5345 + }, + { + "epoch": 0.52, + "learning_rate": 1.0692e-05, + "loss": 0.2022, + "step": 5350 + }, + { + "epoch": 0.52, + "learning_rate": 1.0702e-05, + "loss": 0.1966, + "step": 5355 + }, + { + "epoch": 0.52, + "learning_rate": 1.0712e-05, + "loss": 0.1869, + "step": 5360 + }, + { + "epoch": 0.52, + "learning_rate": 1.0722e-05, + "loss": 0.1703, + "step": 5365 + }, + { + "epoch": 0.53, + "learning_rate": 1.0732e-05, + "loss": 0.2108, + "step": 5370 + }, + { + "epoch": 0.53, + "learning_rate": 1.0742e-05, + "loss": 0.1829, + "step": 5375 + }, + { + "epoch": 0.53, + "learning_rate": 1.0752e-05, + "loss": 0.1703, + "step": 5380 + }, + { + "epoch": 0.53, + "learning_rate": 1.0762000000000001e-05, + "loss": 0.2128, + "step": 5385 + }, + { + "epoch": 0.53, + "learning_rate": 1.0772e-05, + "loss": 0.1611, + "step": 5390 + }, + { + "epoch": 0.53, + "learning_rate": 1.0782e-05, + "loss": 0.1644, + "step": 5395 + }, + { + "epoch": 0.53, + "learning_rate": 1.0792000000000001e-05, + "loss": 0.1873, + "step": 5400 + }, + { + "epoch": 0.53, + "learning_rate": 1.0802e-05, + "loss": 0.1967, + "step": 5405 + }, + { + "epoch": 0.53, + "learning_rate": 1.0812e-05, + "loss": 0.1671, + "step": 5410 + }, + { + "epoch": 0.53, + "learning_rate": 1.0822e-05, + "loss": 0.18, + "step": 5415 + }, + { + "epoch": 0.53, + "learning_rate": 1.0831999999999999e-05, + "loss": 0.1954, + "step": 5420 + }, + { + "epoch": 0.53, + "learning_rate": 1.0842e-05, + "loss": 0.1611, + "step": 5425 + }, + { + "epoch": 0.53, + "learning_rate": 1.0852e-05, + "loss": 0.1798, + "step": 5430 + }, + { + "epoch": 0.53, + "learning_rate": 1.0862e-05, + "loss": 0.2241, + "step": 5435 + }, + { + "epoch": 0.53, + "learning_rate": 1.0872e-05, + "loss": 0.1804, + "step": 5440 + }, + { + "epoch": 0.53, + "learning_rate": 1.0882e-05, + "loss": 0.1543, + "step": 5445 + }, + { + "epoch": 0.53, + "learning_rate": 1.0892e-05, + "loss": 0.1835, + "step": 5450 + }, + { + "epoch": 0.53, + "learning_rate": 1.0902e-05, + "loss": 0.1919, + "step": 5455 + }, + { + "epoch": 0.53, + "learning_rate": 1.0912000000000002e-05, + "loss": 0.1584, + "step": 5460 + }, + { + "epoch": 0.53, + "learning_rate": 1.0922e-05, + "loss": 0.1714, + "step": 5465 + }, + { + "epoch": 0.53, + "learning_rate": 1.0932e-05, + "loss": 0.2106, + "step": 5470 + }, + { + "epoch": 0.54, + "learning_rate": 1.0942000000000001e-05, + "loss": 0.1737, + "step": 5475 + }, + { + "epoch": 0.54, + "learning_rate": 1.0952e-05, + "loss": 0.1799, + "step": 5480 + }, + { + "epoch": 0.54, + "learning_rate": 1.0962000000000001e-05, + "loss": 0.2123, + "step": 5485 + }, + { + "epoch": 0.54, + "learning_rate": 1.0972000000000001e-05, + "loss": 0.1605, + "step": 5490 + }, + { + "epoch": 0.54, + "learning_rate": 1.0982e-05, + "loss": 0.1737, + "step": 5495 + }, + { + "epoch": 0.54, + "learning_rate": 1.0992e-05, + "loss": 0.1757, + "step": 5500 + }, + { + "epoch": 0.54, + "eval_cer": 0.06815832737917688, + "eval_loss": 0.3069358766078949, + "eval_runtime": 273.2905, + "eval_samples_per_second": 59.9, + "eval_steps_per_second": 1.665, + "eval_wer": 0.1797209144394455, + "step": 5500 + }, + { + "epoch": 0.54, + "learning_rate": 1.1002e-05, + "loss": 0.2149, + "step": 5505 + }, + { + "epoch": 0.54, + "learning_rate": 1.1012e-05, + "loss": 0.1717, + "step": 5510 + }, + { + "epoch": 0.54, + "learning_rate": 1.1022e-05, + "loss": 0.1681, + "step": 5515 + }, + { + "epoch": 0.54, + "learning_rate": 1.1032e-05, + "loss": 0.2079, + "step": 5520 + }, + { + "epoch": 0.54, + "learning_rate": 1.1042e-05, + "loss": 0.2063, + "step": 5525 + }, + { + "epoch": 0.54, + "learning_rate": 1.1052e-05, + "loss": 0.1969, + "step": 5530 + }, + { + "epoch": 0.54, + "learning_rate": 1.1062000000000002e-05, + "loss": 0.2142, + "step": 5535 + }, + { + "epoch": 0.54, + "learning_rate": 1.1072e-05, + "loss": 0.1711, + "step": 5540 + }, + { + "epoch": 0.54, + "learning_rate": 1.1082e-05, + "loss": 0.1694, + "step": 5545 + }, + { + "epoch": 0.54, + "learning_rate": 1.1092000000000002e-05, + "loss": 0.1979, + "step": 5550 + }, + { + "epoch": 0.54, + "learning_rate": 1.1102e-05, + "loss": 0.2092, + "step": 5555 + }, + { + "epoch": 0.54, + "learning_rate": 1.1112e-05, + "loss": 0.1823, + "step": 5560 + }, + { + "epoch": 0.54, + "learning_rate": 1.1122000000000001e-05, + "loss": 0.1632, + "step": 5565 + }, + { + "epoch": 0.54, + "learning_rate": 1.1132e-05, + "loss": 0.2008, + "step": 5570 + }, + { + "epoch": 0.55, + "learning_rate": 1.1142000000000001e-05, + "loss": 0.1636, + "step": 5575 + }, + { + "epoch": 0.55, + "learning_rate": 1.1152000000000001e-05, + "loss": 0.1705, + "step": 5580 + }, + { + "epoch": 0.55, + "learning_rate": 1.1162e-05, + "loss": 0.226, + "step": 5585 + }, + { + "epoch": 0.55, + "learning_rate": 1.1172e-05, + "loss": 0.1755, + "step": 5590 + }, + { + "epoch": 0.55, + "learning_rate": 1.1182e-05, + "loss": 0.1779, + "step": 5595 + }, + { + "epoch": 0.55, + "learning_rate": 1.1192e-05, + "loss": 0.2016, + "step": 5600 + }, + { + "epoch": 0.55, + "learning_rate": 1.1202e-05, + "loss": 0.1935, + "step": 5605 + }, + { + "epoch": 0.55, + "learning_rate": 1.1211999999999999e-05, + "loss": 0.1764, + "step": 5610 + }, + { + "epoch": 0.55, + "learning_rate": 1.1222e-05, + "loss": 0.1544, + "step": 5615 + }, + { + "epoch": 0.55, + "learning_rate": 1.1232e-05, + "loss": 0.2098, + "step": 5620 + }, + { + "epoch": 0.55, + "learning_rate": 1.1242e-05, + "loss": 0.1698, + "step": 5625 + }, + { + "epoch": 0.55, + "learning_rate": 1.1252e-05, + "loss": 0.1862, + "step": 5630 + }, + { + "epoch": 0.55, + "learning_rate": 1.1262e-05, + "loss": 0.2104, + "step": 5635 + }, + { + "epoch": 0.55, + "learning_rate": 1.1272e-05, + "loss": 0.1966, + "step": 5640 + }, + { + "epoch": 0.55, + "learning_rate": 1.1282e-05, + "loss": 0.1534, + "step": 5645 + }, + { + "epoch": 0.55, + "learning_rate": 1.1292000000000001e-05, + "loss": 0.1963, + "step": 5650 + }, + { + "epoch": 0.55, + "learning_rate": 1.1302e-05, + "loss": 0.2002, + "step": 5655 + }, + { + "epoch": 0.55, + "learning_rate": 1.1312e-05, + "loss": 0.1754, + "step": 5660 + }, + { + "epoch": 0.55, + "learning_rate": 1.1322000000000001e-05, + "loss": 0.1682, + "step": 5665 + }, + { + "epoch": 0.55, + "learning_rate": 1.1332e-05, + "loss": 0.2034, + "step": 5670 + }, + { + "epoch": 0.55, + "learning_rate": 1.1342e-05, + "loss": 0.1822, + "step": 5675 + }, + { + "epoch": 0.56, + "learning_rate": 1.1352e-05, + "loss": 0.1851, + "step": 5680 + }, + { + "epoch": 0.56, + "learning_rate": 1.1361999999999999e-05, + "loss": 0.2137, + "step": 5685 + }, + { + "epoch": 0.56, + "learning_rate": 1.1372e-05, + "loss": 0.1795, + "step": 5690 + }, + { + "epoch": 0.56, + "learning_rate": 1.1382e-05, + "loss": 0.1624, + "step": 5695 + }, + { + "epoch": 0.56, + "learning_rate": 1.1392e-05, + "loss": 0.1883, + "step": 5700 + }, + { + "epoch": 0.56, + "learning_rate": 1.1402e-05, + "loss": 0.2023, + "step": 5705 + }, + { + "epoch": 0.56, + "learning_rate": 1.1412e-05, + "loss": 0.1624, + "step": 5710 + }, + { + "epoch": 0.56, + "learning_rate": 1.1422e-05, + "loss": 0.1627, + "step": 5715 + }, + { + "epoch": 0.56, + "learning_rate": 1.1432e-05, + "loss": 0.1941, + "step": 5720 + }, + { + "epoch": 0.56, + "learning_rate": 1.1442000000000002e-05, + "loss": 0.1742, + "step": 5725 + }, + { + "epoch": 0.56, + "learning_rate": 1.1452e-05, + "loss": 0.181, + "step": 5730 + }, + { + "epoch": 0.56, + "learning_rate": 1.1462e-05, + "loss": 0.2062, + "step": 5735 + }, + { + "epoch": 0.56, + "learning_rate": 1.1472000000000001e-05, + "loss": 0.1737, + "step": 5740 + }, + { + "epoch": 0.56, + "learning_rate": 1.1482e-05, + "loss": 0.1848, + "step": 5745 + }, + { + "epoch": 0.56, + "learning_rate": 1.1492000000000001e-05, + "loss": 0.1854, + "step": 5750 + }, + { + "epoch": 0.56, + "learning_rate": 1.1502000000000001e-05, + "loss": 0.1845, + "step": 5755 + }, + { + "epoch": 0.56, + "learning_rate": 1.1512e-05, + "loss": 0.1664, + "step": 5760 + }, + { + "epoch": 0.56, + "learning_rate": 1.1522e-05, + "loss": 0.1767, + "step": 5765 + }, + { + "epoch": 0.56, + "learning_rate": 1.1532e-05, + "loss": 0.214, + "step": 5770 + }, + { + "epoch": 0.56, + "learning_rate": 1.1541999999999999e-05, + "loss": 0.183, + "step": 5775 + }, + { + "epoch": 0.57, + "learning_rate": 1.1552e-05, + "loss": 0.1844, + "step": 5780 + }, + { + "epoch": 0.57, + "learning_rate": 1.1562e-05, + "loss": 0.1847, + "step": 5785 + }, + { + "epoch": 0.57, + "learning_rate": 1.1572e-05, + "loss": 0.1607, + "step": 5790 + }, + { + "epoch": 0.57, + "learning_rate": 1.1582e-05, + "loss": 0.1802, + "step": 5795 + }, + { + "epoch": 0.57, + "learning_rate": 1.1592e-05, + "loss": 0.1992, + "step": 5800 + }, + { + "epoch": 0.57, + "learning_rate": 1.1602e-05, + "loss": 0.1962, + "step": 5805 + }, + { + "epoch": 0.57, + "learning_rate": 1.1612e-05, + "loss": 0.1677, + "step": 5810 + }, + { + "epoch": 0.57, + "learning_rate": 1.1622000000000002e-05, + "loss": 0.1751, + "step": 5815 + }, + { + "epoch": 0.57, + "learning_rate": 1.1632e-05, + "loss": 0.2049, + "step": 5820 + }, + { + "epoch": 0.57, + "learning_rate": 1.1642e-05, + "loss": 0.1661, + "step": 5825 + }, + { + "epoch": 0.57, + "learning_rate": 1.1652000000000001e-05, + "loss": 0.177, + "step": 5830 + }, + { + "epoch": 0.57, + "learning_rate": 1.1662e-05, + "loss": 0.1961, + "step": 5835 + }, + { + "epoch": 0.57, + "learning_rate": 1.1672000000000001e-05, + "loss": 0.1625, + "step": 5840 + }, + { + "epoch": 0.57, + "learning_rate": 1.1682000000000001e-05, + "loss": 0.1773, + "step": 5845 + }, + { + "epoch": 0.57, + "learning_rate": 1.1692e-05, + "loss": 0.1784, + "step": 5850 + }, + { + "epoch": 0.57, + "learning_rate": 1.1702e-05, + "loss": 0.1788, + "step": 5855 + }, + { + "epoch": 0.57, + "learning_rate": 1.1712e-05, + "loss": 0.1433, + "step": 5860 + }, + { + "epoch": 0.57, + "learning_rate": 1.1722e-05, + "loss": 0.1599, + "step": 5865 + }, + { + "epoch": 0.57, + "learning_rate": 1.1732e-05, + "loss": 0.2166, + "step": 5870 + }, + { + "epoch": 0.57, + "learning_rate": 1.1742e-05, + "loss": 0.1654, + "step": 5875 + }, + { + "epoch": 0.57, + "learning_rate": 1.1752e-05, + "loss": 0.1983, + "step": 5880 + }, + { + "epoch": 0.58, + "learning_rate": 1.1762e-05, + "loss": 0.1879, + "step": 5885 + }, + { + "epoch": 0.58, + "learning_rate": 1.1772000000000002e-05, + "loss": 0.1811, + "step": 5890 + }, + { + "epoch": 0.58, + "learning_rate": 1.1782e-05, + "loss": 0.1611, + "step": 5895 + }, + { + "epoch": 0.58, + "learning_rate": 1.1792e-05, + "loss": 0.2017, + "step": 5900 + }, + { + "epoch": 0.58, + "learning_rate": 1.1802000000000002e-05, + "loss": 0.2053, + "step": 5905 + }, + { + "epoch": 0.58, + "learning_rate": 1.1812e-05, + "loss": 0.163, + "step": 5910 + }, + { + "epoch": 0.58, + "learning_rate": 1.1822000000000001e-05, + "loss": 0.1692, + "step": 5915 + }, + { + "epoch": 0.58, + "learning_rate": 1.1832e-05, + "loss": 0.21, + "step": 5920 + }, + { + "epoch": 0.58, + "learning_rate": 1.1842e-05, + "loss": 0.1691, + "step": 5925 + }, + { + "epoch": 0.58, + "learning_rate": 1.1852000000000001e-05, + "loss": 0.1566, + "step": 5930 + }, + { + "epoch": 0.58, + "learning_rate": 1.1862e-05, + "loss": 0.2178, + "step": 5935 + }, + { + "epoch": 0.58, + "learning_rate": 1.1872000000000001e-05, + "loss": 0.1743, + "step": 5940 + }, + { + "epoch": 0.58, + "learning_rate": 1.1882e-05, + "loss": 0.1749, + "step": 5945 + }, + { + "epoch": 0.58, + "learning_rate": 1.1891999999999999e-05, + "loss": 0.1836, + "step": 5950 + }, + { + "epoch": 0.58, + "learning_rate": 1.1902e-05, + "loss": 0.1928, + "step": 5955 + }, + { + "epoch": 0.58, + "learning_rate": 1.1912e-05, + "loss": 0.1589, + "step": 5960 + }, + { + "epoch": 0.58, + "learning_rate": 1.1922e-05, + "loss": 0.1778, + "step": 5965 + }, + { + "epoch": 0.58, + "learning_rate": 1.1932e-05, + "loss": 0.1847, + "step": 5970 + }, + { + "epoch": 0.58, + "learning_rate": 1.1942e-05, + "loss": 0.1776, + "step": 5975 + }, + { + "epoch": 0.58, + "learning_rate": 1.1952e-05, + "loss": 0.1551, + "step": 5980 + }, + { + "epoch": 0.59, + "learning_rate": 1.1962e-05, + "loss": 0.1823, + "step": 5985 + }, + { + "epoch": 0.59, + "learning_rate": 1.1972e-05, + "loss": 0.2004, + "step": 5990 + }, + { + "epoch": 0.59, + "learning_rate": 1.1982e-05, + "loss": 0.169, + "step": 5995 + }, + { + "epoch": 0.59, + "learning_rate": 1.1992e-05, + "loss": 0.1966, + "step": 6000 + }, + { + "epoch": 0.59, + "eval_cer": 0.0663408644741497, + "eval_loss": 0.2984313368797302, + "eval_runtime": 273.9548, + "eval_samples_per_second": 59.754, + "eval_steps_per_second": 1.661, + "eval_wer": 0.17860431100344124, + "step": 6000 + }, + { + "epoch": 0.59, + "learning_rate": 1.2002000000000001e-05, + "loss": 0.2027, + "step": 6005 + }, + { + "epoch": 0.59, + "learning_rate": 1.2012e-05, + "loss": 0.1651, + "step": 6010 + }, + { + "epoch": 0.59, + "learning_rate": 1.2022e-05, + "loss": 0.1546, + "step": 6015 + }, + { + "epoch": 0.59, + "learning_rate": 1.2032000000000001e-05, + "loss": 0.2005, + "step": 6020 + }, + { + "epoch": 0.59, + "learning_rate": 1.2042e-05, + "loss": 0.1943, + "step": 6025 + }, + { + "epoch": 0.59, + "learning_rate": 1.2052e-05, + "loss": 0.1924, + "step": 6030 + }, + { + "epoch": 0.59, + "learning_rate": 1.2062e-05, + "loss": 0.1964, + "step": 6035 + }, + { + "epoch": 0.59, + "learning_rate": 1.2071999999999999e-05, + "loss": 0.1702, + "step": 6040 + }, + { + "epoch": 0.59, + "learning_rate": 1.2082e-05, + "loss": 0.1621, + "step": 6045 + }, + { + "epoch": 0.59, + "learning_rate": 1.2092e-05, + "loss": 0.17, + "step": 6050 + }, + { + "epoch": 0.59, + "learning_rate": 1.2102e-05, + "loss": 0.1771, + "step": 6055 + }, + { + "epoch": 0.59, + "learning_rate": 1.2112e-05, + "loss": 0.17, + "step": 6060 + }, + { + "epoch": 0.59, + "learning_rate": 1.2122e-05, + "loss": 0.184, + "step": 6065 + }, + { + "epoch": 0.59, + "learning_rate": 1.2132e-05, + "loss": 0.188, + "step": 6070 + }, + { + "epoch": 0.59, + "learning_rate": 1.2142e-05, + "loss": 0.1663, + "step": 6075 + }, + { + "epoch": 0.59, + "learning_rate": 1.2152000000000002e-05, + "loss": 0.1598, + "step": 6080 + }, + { + "epoch": 0.6, + "learning_rate": 1.2162e-05, + "loss": 0.2121, + "step": 6085 + }, + { + "epoch": 0.6, + "learning_rate": 1.2172e-05, + "loss": 0.1712, + "step": 6090 + }, + { + "epoch": 0.6, + "learning_rate": 1.2182000000000001e-05, + "loss": 0.15, + "step": 6095 + }, + { + "epoch": 0.6, + "learning_rate": 1.2192e-05, + "loss": 0.185, + "step": 6100 + }, + { + "epoch": 0.6, + "learning_rate": 1.2202000000000001e-05, + "loss": 0.1964, + "step": 6105 + }, + { + "epoch": 0.6, + "learning_rate": 1.2212000000000001e-05, + "loss": 0.1646, + "step": 6110 + }, + { + "epoch": 0.6, + "learning_rate": 1.2222e-05, + "loss": 0.1763, + "step": 6115 + }, + { + "epoch": 0.6, + "learning_rate": 1.2232e-05, + "loss": 0.2296, + "step": 6120 + }, + { + "epoch": 0.6, + "learning_rate": 1.2242e-05, + "loss": 0.1813, + "step": 6125 + }, + { + "epoch": 0.6, + "learning_rate": 1.2252e-05, + "loss": 0.1649, + "step": 6130 + }, + { + "epoch": 0.6, + "learning_rate": 1.2262e-05, + "loss": 0.2013, + "step": 6135 + }, + { + "epoch": 0.6, + "learning_rate": 1.2272e-05, + "loss": 0.1669, + "step": 6140 + }, + { + "epoch": 0.6, + "learning_rate": 1.2282e-05, + "loss": 0.1608, + "step": 6145 + }, + { + "epoch": 0.6, + "learning_rate": 1.2292e-05, + "loss": 0.1859, + "step": 6150 + }, + { + "epoch": 0.6, + "learning_rate": 1.2302000000000002e-05, + "loss": 0.1725, + "step": 6155 + }, + { + "epoch": 0.6, + "learning_rate": 1.2312e-05, + "loss": 0.1815, + "step": 6160 + }, + { + "epoch": 0.6, + "learning_rate": 1.2322e-05, + "loss": 0.1582, + "step": 6165 + }, + { + "epoch": 0.6, + "learning_rate": 1.2332000000000002e-05, + "loss": 0.1895, + "step": 6170 + }, + { + "epoch": 0.6, + "learning_rate": 1.2342e-05, + "loss": 0.1678, + "step": 6175 + }, + { + "epoch": 0.6, + "learning_rate": 1.2352000000000001e-05, + "loss": 0.1624, + "step": 6180 + }, + { + "epoch": 0.6, + "learning_rate": 1.2362000000000001e-05, + "loss": 0.194, + "step": 6185 + }, + { + "epoch": 0.61, + "learning_rate": 1.2372e-05, + "loss": 0.1758, + "step": 6190 + }, + { + "epoch": 0.61, + "learning_rate": 1.2382000000000001e-05, + "loss": 0.1673, + "step": 6195 + }, + { + "epoch": 0.61, + "learning_rate": 1.2392000000000001e-05, + "loss": 0.1837, + "step": 6200 + }, + { + "epoch": 0.61, + "learning_rate": 1.2402e-05, + "loss": 0.1887, + "step": 6205 + }, + { + "epoch": 0.61, + "learning_rate": 1.2412e-05, + "loss": 0.172, + "step": 6210 + }, + { + "epoch": 0.61, + "learning_rate": 1.2422e-05, + "loss": 0.1989, + "step": 6215 + }, + { + "epoch": 0.61, + "learning_rate": 1.2432e-05, + "loss": 0.1964, + "step": 6220 + }, + { + "epoch": 0.61, + "learning_rate": 1.2442e-05, + "loss": 0.1569, + "step": 6225 + }, + { + "epoch": 0.61, + "learning_rate": 1.2451999999999999e-05, + "loss": 0.1785, + "step": 6230 + }, + { + "epoch": 0.61, + "learning_rate": 1.2462e-05, + "loss": 0.201, + "step": 6235 + }, + { + "epoch": 0.61, + "learning_rate": 1.2472e-05, + "loss": 0.1663, + "step": 6240 + }, + { + "epoch": 0.61, + "learning_rate": 1.2482e-05, + "loss": 0.1847, + "step": 6245 + }, + { + "epoch": 0.61, + "learning_rate": 1.2492e-05, + "loss": 0.1958, + "step": 6250 + }, + { + "epoch": 0.61, + "learning_rate": 1.2502e-05, + "loss": 0.1965, + "step": 6255 + }, + { + "epoch": 0.61, + "learning_rate": 1.2512e-05, + "loss": 0.1418, + "step": 6260 + }, + { + "epoch": 0.61, + "learning_rate": 1.2522e-05, + "loss": 0.1861, + "step": 6265 + }, + { + "epoch": 0.61, + "learning_rate": 1.2532000000000001e-05, + "loss": 0.1848, + "step": 6270 + }, + { + "epoch": 0.61, + "learning_rate": 1.2542e-05, + "loss": 0.1649, + "step": 6275 + }, + { + "epoch": 0.61, + "learning_rate": 1.2552e-05, + "loss": 0.166, + "step": 6280 + }, + { + "epoch": 0.61, + "learning_rate": 1.2562000000000001e-05, + "loss": 0.213, + "step": 6285 + }, + { + "epoch": 0.62, + "learning_rate": 1.2572e-05, + "loss": 0.1625, + "step": 6290 + }, + { + "epoch": 0.62, + "learning_rate": 1.2582e-05, + "loss": 0.1586, + "step": 6295 + }, + { + "epoch": 0.62, + "learning_rate": 1.2592e-05, + "loss": 0.173, + "step": 6300 + }, + { + "epoch": 0.62, + "learning_rate": 1.2601999999999999e-05, + "loss": 0.1872, + "step": 6305 + }, + { + "epoch": 0.62, + "learning_rate": 1.2612e-05, + "loss": 0.1724, + "step": 6310 + }, + { + "epoch": 0.62, + "learning_rate": 1.2622e-05, + "loss": 0.1902, + "step": 6315 + }, + { + "epoch": 0.62, + "learning_rate": 1.2632e-05, + "loss": 0.19, + "step": 6320 + }, + { + "epoch": 0.62, + "learning_rate": 1.2642e-05, + "loss": 0.1848, + "step": 6325 + }, + { + "epoch": 0.62, + "learning_rate": 1.2652e-05, + "loss": 0.1617, + "step": 6330 + }, + { + "epoch": 0.62, + "learning_rate": 1.2662e-05, + "loss": 0.1949, + "step": 6335 + }, + { + "epoch": 0.62, + "learning_rate": 1.2672e-05, + "loss": 0.1783, + "step": 6340 + }, + { + "epoch": 0.62, + "learning_rate": 1.2682000000000002e-05, + "loss": 0.1602, + "step": 6345 + }, + { + "epoch": 0.62, + "learning_rate": 1.2692e-05, + "loss": 0.1954, + "step": 6350 + }, + { + "epoch": 0.62, + "learning_rate": 1.2702e-05, + "loss": 0.1702, + "step": 6355 + }, + { + "epoch": 0.62, + "learning_rate": 1.2712000000000001e-05, + "loss": 0.159, + "step": 6360 + }, + { + "epoch": 0.62, + "learning_rate": 1.2722e-05, + "loss": 0.2024, + "step": 6365 + }, + { + "epoch": 0.62, + "learning_rate": 1.2732000000000001e-05, + "loss": 0.1931, + "step": 6370 + }, + { + "epoch": 0.62, + "learning_rate": 1.2742000000000001e-05, + "loss": 0.1529, + "step": 6375 + }, + { + "epoch": 0.62, + "learning_rate": 1.2752e-05, + "loss": 0.188, + "step": 6380 + }, + { + "epoch": 0.62, + "learning_rate": 1.2762e-05, + "loss": 0.2074, + "step": 6385 + }, + { + "epoch": 0.62, + "learning_rate": 1.2772e-05, + "loss": 0.1705, + "step": 6390 + }, + { + "epoch": 0.63, + "learning_rate": 1.2782e-05, + "loss": 0.1741, + "step": 6395 + }, + { + "epoch": 0.63, + "learning_rate": 1.2792e-05, + "loss": 0.1678, + "step": 6400 + }, + { + "epoch": 0.63, + "learning_rate": 1.2802e-05, + "loss": 0.1889, + "step": 6405 + }, + { + "epoch": 0.63, + "learning_rate": 1.2812e-05, + "loss": 0.1749, + "step": 6410 + }, + { + "epoch": 0.63, + "learning_rate": 1.2822e-05, + "loss": 0.169, + "step": 6415 + }, + { + "epoch": 0.63, + "learning_rate": 1.2832e-05, + "loss": 0.2101, + "step": 6420 + }, + { + "epoch": 0.63, + "learning_rate": 1.2842e-05, + "loss": 0.1578, + "step": 6425 + }, + { + "epoch": 0.63, + "learning_rate": 1.2852e-05, + "loss": 0.1718, + "step": 6430 + }, + { + "epoch": 0.63, + "learning_rate": 1.2862000000000002e-05, + "loss": 0.2019, + "step": 6435 + }, + { + "epoch": 0.63, + "learning_rate": 1.2872e-05, + "loss": 0.1735, + "step": 6440 + }, + { + "epoch": 0.63, + "learning_rate": 1.2882e-05, + "loss": 0.1702, + "step": 6445 + }, + { + "epoch": 0.63, + "learning_rate": 1.2892000000000001e-05, + "loss": 0.2021, + "step": 6450 + }, + { + "epoch": 0.63, + "learning_rate": 1.2902e-05, + "loss": 0.1788, + "step": 6455 + }, + { + "epoch": 0.63, + "learning_rate": 1.2912000000000001e-05, + "loss": 0.169, + "step": 6460 + }, + { + "epoch": 0.63, + "learning_rate": 1.2922000000000001e-05, + "loss": 0.1565, + "step": 6465 + }, + { + "epoch": 0.63, + "learning_rate": 1.2932e-05, + "loss": 0.2076, + "step": 6470 + }, + { + "epoch": 0.63, + "learning_rate": 1.2942e-05, + "loss": 0.1607, + "step": 6475 + }, + { + "epoch": 0.63, + "learning_rate": 1.2952e-05, + "loss": 0.1497, + "step": 6480 + }, + { + "epoch": 0.63, + "learning_rate": 1.2962e-05, + "loss": 0.1996, + "step": 6485 + }, + { + "epoch": 0.63, + "learning_rate": 1.2972e-05, + "loss": 0.1568, + "step": 6490 + }, + { + "epoch": 0.64, + "learning_rate": 1.2982e-05, + "loss": 0.1747, + "step": 6495 + }, + { + "epoch": 0.64, + "learning_rate": 1.2992e-05, + "loss": 0.1924, + "step": 6500 + }, + { + "epoch": 0.64, + "eval_cer": 0.06756984861412672, + "eval_loss": 0.30143997073173523, + "eval_runtime": 277.1502, + "eval_samples_per_second": 59.065, + "eval_steps_per_second": 1.642, + "eval_wer": 0.17952501909979562, + "step": 6500 + }, + { + "epoch": 0.64, + "learning_rate": 1.3002e-05, + "loss": 0.1856, + "step": 6505 + }, + { + "epoch": 0.64, + "learning_rate": 1.3012000000000002e-05, + "loss": 0.1678, + "step": 6510 + }, + { + "epoch": 0.64, + "learning_rate": 1.3022e-05, + "loss": 0.1745, + "step": 6515 + }, + { + "epoch": 0.64, + "learning_rate": 1.3032e-05, + "loss": 0.1733, + "step": 6520 + }, + { + "epoch": 0.64, + "learning_rate": 1.3042000000000002e-05, + "loss": 0.1656, + "step": 6525 + }, + { + "epoch": 0.64, + "learning_rate": 1.3052e-05, + "loss": 0.1804, + "step": 6530 + }, + { + "epoch": 0.64, + "learning_rate": 1.3062000000000001e-05, + "loss": 0.2091, + "step": 6535 + }, + { + "epoch": 0.64, + "learning_rate": 1.3072e-05, + "loss": 0.1646, + "step": 6540 + }, + { + "epoch": 0.64, + "learning_rate": 1.3082e-05, + "loss": 0.1772, + "step": 6545 + }, + { + "epoch": 0.64, + "learning_rate": 1.3092000000000001e-05, + "loss": 0.1922, + "step": 6550 + }, + { + "epoch": 0.64, + "learning_rate": 1.3102e-05, + "loss": 0.2001, + "step": 6555 + }, + { + "epoch": 0.64, + "learning_rate": 1.3112e-05, + "loss": 0.172, + "step": 6560 + }, + { + "epoch": 0.64, + "learning_rate": 1.3122e-05, + "loss": 0.1636, + "step": 6565 + }, + { + "epoch": 0.64, + "learning_rate": 1.3131999999999999e-05, + "loss": 0.2071, + "step": 6570 + }, + { + "epoch": 0.64, + "learning_rate": 1.3142e-05, + "loss": 0.17, + "step": 6575 + }, + { + "epoch": 0.64, + "learning_rate": 1.3152e-05, + "loss": 0.1555, + "step": 6580 + }, + { + "epoch": 0.64, + "learning_rate": 1.3162e-05, + "loss": 0.1964, + "step": 6585 + }, + { + "epoch": 0.64, + "learning_rate": 1.3172e-05, + "loss": 0.1664, + "step": 6590 + }, + { + "epoch": 0.64, + "learning_rate": 1.3182e-05, + "loss": 0.1565, + "step": 6595 + }, + { + "epoch": 0.65, + "learning_rate": 1.3192e-05, + "loss": 0.1928, + "step": 6600 + }, + { + "epoch": 0.65, + "learning_rate": 1.3202e-05, + "loss": 0.1744, + "step": 6605 + }, + { + "epoch": 0.65, + "learning_rate": 1.3212000000000002e-05, + "loss": 0.1511, + "step": 6610 + }, + { + "epoch": 0.65, + "learning_rate": 1.3222e-05, + "loss": 0.1606, + "step": 6615 + }, + { + "epoch": 0.65, + "learning_rate": 1.3232e-05, + "loss": 0.2108, + "step": 6620 + }, + { + "epoch": 0.65, + "learning_rate": 1.3242000000000001e-05, + "loss": 0.1847, + "step": 6625 + }, + { + "epoch": 0.65, + "learning_rate": 1.3252e-05, + "loss": 0.1615, + "step": 6630 + }, + { + "epoch": 0.65, + "learning_rate": 1.3262e-05, + "loss": 0.2218, + "step": 6635 + }, + { + "epoch": 0.65, + "learning_rate": 1.3272000000000001e-05, + "loss": 0.1642, + "step": 6640 + }, + { + "epoch": 0.65, + "learning_rate": 1.3282e-05, + "loss": 0.1713, + "step": 6645 + }, + { + "epoch": 0.65, + "learning_rate": 1.3292e-05, + "loss": 0.209, + "step": 6650 + }, + { + "epoch": 0.65, + "learning_rate": 1.3302e-05, + "loss": 0.1775, + "step": 6655 + }, + { + "epoch": 0.65, + "learning_rate": 1.3311999999999999e-05, + "loss": 0.1526, + "step": 6660 + }, + { + "epoch": 0.65, + "learning_rate": 1.3322e-05, + "loss": 0.1597, + "step": 6665 + }, + { + "epoch": 0.65, + "learning_rate": 1.3332e-05, + "loss": 0.2078, + "step": 6670 + }, + { + "epoch": 0.65, + "learning_rate": 1.3342e-05, + "loss": 0.1696, + "step": 6675 + }, + { + "epoch": 0.65, + "learning_rate": 1.3352e-05, + "loss": 0.1625, + "step": 6680 + }, + { + "epoch": 0.65, + "learning_rate": 1.3362e-05, + "loss": 0.1889, + "step": 6685 + }, + { + "epoch": 0.65, + "learning_rate": 1.3372e-05, + "loss": 0.1745, + "step": 6690 + }, + { + "epoch": 0.65, + "learning_rate": 1.3382e-05, + "loss": 0.1738, + "step": 6695 + }, + { + "epoch": 0.66, + "learning_rate": 1.3392000000000002e-05, + "loss": 0.1943, + "step": 6700 + }, + { + "epoch": 0.66, + "learning_rate": 1.3402e-05, + "loss": 0.2044, + "step": 6705 + }, + { + "epoch": 0.66, + "learning_rate": 1.3412e-05, + "loss": 0.1719, + "step": 6710 + }, + { + "epoch": 0.66, + "learning_rate": 1.3422000000000001e-05, + "loss": 0.1906, + "step": 6715 + }, + { + "epoch": 0.66, + "learning_rate": 1.3432e-05, + "loss": 0.1895, + "step": 6720 + }, + { + "epoch": 0.66, + "learning_rate": 1.3442000000000001e-05, + "loss": 0.2033, + "step": 6725 + }, + { + "epoch": 0.66, + "learning_rate": 1.3452000000000001e-05, + "loss": 0.1698, + "step": 6730 + }, + { + "epoch": 0.66, + "learning_rate": 1.3462e-05, + "loss": 0.2002, + "step": 6735 + }, + { + "epoch": 0.66, + "learning_rate": 1.3472e-05, + "loss": 0.184, + "step": 6740 + }, + { + "epoch": 0.66, + "learning_rate": 1.3482e-05, + "loss": 0.142, + "step": 6745 + }, + { + "epoch": 0.66, + "learning_rate": 1.3492e-05, + "loss": 0.1824, + "step": 6750 + }, + { + "epoch": 0.66, + "learning_rate": 1.3502e-05, + "loss": 0.1794, + "step": 6755 + }, + { + "epoch": 0.66, + "learning_rate": 1.3512e-05, + "loss": 0.1652, + "step": 6760 + }, + { + "epoch": 0.66, + "learning_rate": 1.3522e-05, + "loss": 0.1727, + "step": 6765 + }, + { + "epoch": 0.66, + "learning_rate": 1.3532e-05, + "loss": 0.217, + "step": 6770 + }, + { + "epoch": 0.66, + "learning_rate": 1.3542000000000002e-05, + "loss": 0.155, + "step": 6775 + }, + { + "epoch": 0.66, + "learning_rate": 1.3552e-05, + "loss": 0.154, + "step": 6780 + }, + { + "epoch": 0.66, + "learning_rate": 1.3562e-05, + "loss": 0.2067, + "step": 6785 + }, + { + "epoch": 0.66, + "learning_rate": 1.3572000000000002e-05, + "loss": 0.1726, + "step": 6790 + }, + { + "epoch": 0.66, + "learning_rate": 1.3582e-05, + "loss": 0.1694, + "step": 6795 + }, + { + "epoch": 0.66, + "learning_rate": 1.3592000000000001e-05, + "loss": 0.1813, + "step": 6800 + }, + { + "epoch": 0.67, + "learning_rate": 1.3602000000000001e-05, + "loss": 0.187, + "step": 6805 + }, + { + "epoch": 0.67, + "learning_rate": 1.3612e-05, + "loss": 0.1544, + "step": 6810 + }, + { + "epoch": 0.67, + "learning_rate": 1.3622000000000001e-05, + "loss": 0.1491, + "step": 6815 + }, + { + "epoch": 0.67, + "learning_rate": 1.3632000000000001e-05, + "loss": 0.1986, + "step": 6820 + }, + { + "epoch": 0.67, + "learning_rate": 1.3642e-05, + "loss": 0.1555, + "step": 6825 + }, + { + "epoch": 0.67, + "learning_rate": 1.3652e-05, + "loss": 0.1546, + "step": 6830 + }, + { + "epoch": 0.67, + "learning_rate": 1.3662e-05, + "loss": 0.2018, + "step": 6835 + }, + { + "epoch": 0.67, + "learning_rate": 1.3672e-05, + "loss": 0.1524, + "step": 6840 + }, + { + "epoch": 0.67, + "learning_rate": 1.3682e-05, + "loss": 0.1643, + "step": 6845 + }, + { + "epoch": 0.67, + "learning_rate": 1.3691999999999999e-05, + "loss": 0.1892, + "step": 6850 + }, + { + "epoch": 0.67, + "learning_rate": 1.3702e-05, + "loss": 0.1994, + "step": 6855 + }, + { + "epoch": 0.67, + "learning_rate": 1.3712e-05, + "loss": 0.148, + "step": 6860 + }, + { + "epoch": 0.67, + "learning_rate": 1.3722e-05, + "loss": 0.1725, + "step": 6865 + }, + { + "epoch": 0.67, + "learning_rate": 1.3732e-05, + "loss": 0.1842, + "step": 6870 + }, + { + "epoch": 0.67, + "learning_rate": 1.3742e-05, + "loss": 0.1797, + "step": 6875 + }, + { + "epoch": 0.67, + "learning_rate": 1.3752e-05, + "loss": 0.1672, + "step": 6880 + }, + { + "epoch": 0.67, + "learning_rate": 1.3762e-05, + "loss": 0.199, + "step": 6885 + }, + { + "epoch": 0.67, + "learning_rate": 1.3772000000000001e-05, + "loss": 0.1884, + "step": 6890 + }, + { + "epoch": 0.67, + "learning_rate": 1.3782e-05, + "loss": 0.1673, + "step": 6895 + }, + { + "epoch": 0.67, + "learning_rate": 1.3792e-05, + "loss": 0.1954, + "step": 6900 + }, + { + "epoch": 0.68, + "learning_rate": 1.3802000000000001e-05, + "loss": 0.1846, + "step": 6905 + }, + { + "epoch": 0.68, + "learning_rate": 1.3812e-05, + "loss": 0.1489, + "step": 6910 + }, + { + "epoch": 0.68, + "learning_rate": 1.3822e-05, + "loss": 0.1662, + "step": 6915 + }, + { + "epoch": 0.68, + "learning_rate": 1.3832e-05, + "loss": 0.2036, + "step": 6920 + }, + { + "epoch": 0.68, + "learning_rate": 1.3841999999999999e-05, + "loss": 0.1622, + "step": 6925 + }, + { + "epoch": 0.68, + "learning_rate": 1.3852e-05, + "loss": 0.1601, + "step": 6930 + }, + { + "epoch": 0.68, + "learning_rate": 1.3862e-05, + "loss": 0.1769, + "step": 6935 + }, + { + "epoch": 0.68, + "learning_rate": 1.3872e-05, + "loss": 0.1759, + "step": 6940 + }, + { + "epoch": 0.68, + "learning_rate": 1.3882e-05, + "loss": 0.1622, + "step": 6945 + }, + { + "epoch": 0.68, + "learning_rate": 1.3892e-05, + "loss": 0.1738, + "step": 6950 + }, + { + "epoch": 0.68, + "learning_rate": 1.3902e-05, + "loss": 0.174, + "step": 6955 + }, + { + "epoch": 0.68, + "learning_rate": 1.3912e-05, + "loss": 0.1505, + "step": 6960 + }, + { + "epoch": 0.68, + "learning_rate": 1.3922000000000002e-05, + "loss": 0.1522, + "step": 6965 + }, + { + "epoch": 0.68, + "learning_rate": 1.3932e-05, + "loss": 0.1851, + "step": 6970 + }, + { + "epoch": 0.68, + "learning_rate": 1.3942e-05, + "loss": 0.1597, + "step": 6975 + }, + { + "epoch": 0.68, + "learning_rate": 1.3952000000000001e-05, + "loss": 0.1622, + "step": 6980 + }, + { + "epoch": 0.68, + "learning_rate": 1.3962e-05, + "loss": 0.1954, + "step": 6985 + }, + { + "epoch": 0.68, + "learning_rate": 1.3972000000000001e-05, + "loss": 0.1565, + "step": 6990 + }, + { + "epoch": 0.68, + "learning_rate": 1.3982000000000001e-05, + "loss": 0.1542, + "step": 6995 + }, + { + "epoch": 0.68, + "learning_rate": 1.399e-05, + "loss": 0.19, + "step": 7000 + }, + { + "epoch": 0.68, + "eval_cer": 0.06561711652342007, + "eval_loss": 0.3058803677558899, + "eval_runtime": 274.2831, + "eval_samples_per_second": 59.683, + "eval_steps_per_second": 1.659, + "eval_wer": 0.17405953912356426, + "step": 7000 + }, + { + "epoch": 0.68, + "learning_rate": 1.4e-05, + "loss": 0.1895, + "step": 7005 + }, + { + "epoch": 0.69, + "learning_rate": 1.4010000000000001e-05, + "loss": 0.1743, + "step": 7010 + }, + { + "epoch": 0.69, + "learning_rate": 1.402e-05, + "loss": 0.1675, + "step": 7015 + }, + { + "epoch": 0.69, + "learning_rate": 1.4030000000000001e-05, + "loss": 0.1902, + "step": 7020 + }, + { + "epoch": 0.69, + "learning_rate": 1.4040000000000001e-05, + "loss": 0.1766, + "step": 7025 + }, + { + "epoch": 0.69, + "learning_rate": 1.405e-05, + "loss": 0.1645, + "step": 7030 + }, + { + "epoch": 0.69, + "learning_rate": 1.4060000000000001e-05, + "loss": 0.2078, + "step": 7035 + }, + { + "epoch": 0.69, + "learning_rate": 1.4069999999999999e-05, + "loss": 0.1658, + "step": 7040 + }, + { + "epoch": 0.69, + "learning_rate": 1.408e-05, + "loss": 0.1699, + "step": 7045 + }, + { + "epoch": 0.69, + "learning_rate": 1.409e-05, + "loss": 0.1745, + "step": 7050 + }, + { + "epoch": 0.69, + "learning_rate": 1.4099999999999999e-05, + "loss": 0.173, + "step": 7055 + }, + { + "epoch": 0.69, + "learning_rate": 1.411e-05, + "loss": 0.1544, + "step": 7060 + }, + { + "epoch": 0.69, + "learning_rate": 1.412e-05, + "loss": 0.1693, + "step": 7065 + }, + { + "epoch": 0.69, + "learning_rate": 1.413e-05, + "loss": 0.1956, + "step": 7070 + }, + { + "epoch": 0.69, + "learning_rate": 1.414e-05, + "loss": 0.1718, + "step": 7075 + }, + { + "epoch": 0.69, + "learning_rate": 1.415e-05, + "loss": 0.1864, + "step": 7080 + }, + { + "epoch": 0.69, + "learning_rate": 1.416e-05, + "loss": 0.174, + "step": 7085 + }, + { + "epoch": 0.69, + "learning_rate": 1.417e-05, + "loss": 0.159, + "step": 7090 + }, + { + "epoch": 0.69, + "learning_rate": 1.4180000000000001e-05, + "loss": 0.1534, + "step": 7095 + }, + { + "epoch": 0.69, + "learning_rate": 1.419e-05, + "loss": 0.1521, + "step": 7100 + }, + { + "epoch": 0.69, + "learning_rate": 1.42e-05, + "loss": 0.179, + "step": 7105 + }, + { + "epoch": 0.7, + "learning_rate": 1.4210000000000001e-05, + "loss": 0.1524, + "step": 7110 + }, + { + "epoch": 0.7, + "learning_rate": 1.422e-05, + "loss": 0.1782, + "step": 7115 + }, + { + "epoch": 0.7, + "learning_rate": 1.4230000000000001e-05, + "loss": 0.2027, + "step": 7120 + }, + { + "epoch": 0.7, + "learning_rate": 1.4240000000000001e-05, + "loss": 0.1575, + "step": 7125 + }, + { + "epoch": 0.7, + "learning_rate": 1.4249999999999999e-05, + "loss": 0.1572, + "step": 7130 + }, + { + "epoch": 0.7, + "learning_rate": 1.426e-05, + "loss": 0.1889, + "step": 7135 + }, + { + "epoch": 0.7, + "learning_rate": 1.427e-05, + "loss": 0.1826, + "step": 7140 + }, + { + "epoch": 0.7, + "learning_rate": 1.428e-05, + "loss": 0.1643, + "step": 7145 + }, + { + "epoch": 0.7, + "learning_rate": 1.429e-05, + "loss": 0.1886, + "step": 7150 + }, + { + "epoch": 0.7, + "learning_rate": 1.43e-05, + "loss": 0.1893, + "step": 7155 + }, + { + "epoch": 0.7, + "learning_rate": 1.431e-05, + "loss": 0.1665, + "step": 7160 + }, + { + "epoch": 0.7, + "learning_rate": 1.432e-05, + "loss": 0.1804, + "step": 7165 + }, + { + "epoch": 0.7, + "learning_rate": 1.4330000000000002e-05, + "loss": 0.193, + "step": 7170 + }, + { + "epoch": 0.7, + "learning_rate": 1.434e-05, + "loss": 0.1799, + "step": 7175 + }, + { + "epoch": 0.7, + "learning_rate": 1.435e-05, + "loss": 0.1628, + "step": 7180 + }, + { + "epoch": 0.7, + "learning_rate": 1.4360000000000001e-05, + "loss": 0.1941, + "step": 7185 + }, + { + "epoch": 0.7, + "learning_rate": 1.437e-05, + "loss": 0.1683, + "step": 7190 + }, + { + "epoch": 0.7, + "learning_rate": 1.438e-05, + "loss": 0.1426, + "step": 7195 + }, + { + "epoch": 0.7, + "learning_rate": 1.4390000000000001e-05, + "loss": 0.1765, + "step": 7200 + }, + { + "epoch": 0.7, + "learning_rate": 1.44e-05, + "loss": 0.1668, + "step": 7205 + }, + { + "epoch": 0.71, + "learning_rate": 1.4410000000000001e-05, + "loss": 0.1747, + "step": 7210 + }, + { + "epoch": 0.71, + "learning_rate": 1.4420000000000001e-05, + "loss": 0.1581, + "step": 7215 + }, + { + "epoch": 0.71, + "learning_rate": 1.4429999999999999e-05, + "loss": 0.2052, + "step": 7220 + }, + { + "epoch": 0.71, + "learning_rate": 1.444e-05, + "loss": 0.1549, + "step": 7225 + }, + { + "epoch": 0.71, + "learning_rate": 1.445e-05, + "loss": 0.1569, + "step": 7230 + }, + { + "epoch": 0.71, + "learning_rate": 1.446e-05, + "loss": 0.2076, + "step": 7235 + }, + { + "epoch": 0.71, + "learning_rate": 1.447e-05, + "loss": 0.1813, + "step": 7240 + }, + { + "epoch": 0.71, + "learning_rate": 1.448e-05, + "loss": 0.1742, + "step": 7245 + }, + { + "epoch": 0.71, + "learning_rate": 1.449e-05, + "loss": 0.1768, + "step": 7250 + }, + { + "epoch": 0.71, + "learning_rate": 1.45e-05, + "loss": 0.1978, + "step": 7255 + }, + { + "epoch": 0.71, + "learning_rate": 1.4510000000000002e-05, + "loss": 0.1638, + "step": 7260 + }, + { + "epoch": 0.71, + "learning_rate": 1.452e-05, + "loss": 0.1565, + "step": 7265 + }, + { + "epoch": 0.71, + "learning_rate": 1.453e-05, + "loss": 0.1884, + "step": 7270 + }, + { + "epoch": 0.71, + "learning_rate": 1.4540000000000001e-05, + "loss": 0.1706, + "step": 7275 + }, + { + "epoch": 0.71, + "learning_rate": 1.455e-05, + "loss": 0.183, + "step": 7280 + }, + { + "epoch": 0.71, + "learning_rate": 1.4560000000000001e-05, + "loss": 0.1883, + "step": 7285 + }, + { + "epoch": 0.71, + "learning_rate": 1.4570000000000001e-05, + "loss": 0.1893, + "step": 7290 + }, + { + "epoch": 0.71, + "learning_rate": 1.458e-05, + "loss": 0.1398, + "step": 7295 + }, + { + "epoch": 0.71, + "learning_rate": 1.4590000000000001e-05, + "loss": 0.1937, + "step": 7300 + }, + { + "epoch": 0.71, + "learning_rate": 1.46e-05, + "loss": 0.1906, + "step": 7305 + }, + { + "epoch": 0.71, + "learning_rate": 1.461e-05, + "loss": 0.159, + "step": 7310 + }, + { + "epoch": 0.72, + "learning_rate": 1.462e-05, + "loss": 0.1534, + "step": 7315 + }, + { + "epoch": 0.72, + "learning_rate": 1.463e-05, + "loss": 0.221, + "step": 7320 + }, + { + "epoch": 0.72, + "learning_rate": 1.464e-05, + "loss": 0.1561, + "step": 7325 + }, + { + "epoch": 0.72, + "learning_rate": 1.465e-05, + "loss": 0.1553, + "step": 7330 + }, + { + "epoch": 0.72, + "learning_rate": 1.4660000000000002e-05, + "loss": 0.1742, + "step": 7335 + }, + { + "epoch": 0.72, + "learning_rate": 1.467e-05, + "loss": 0.1724, + "step": 7340 + }, + { + "epoch": 0.72, + "learning_rate": 1.468e-05, + "loss": 0.1583, + "step": 7345 + }, + { + "epoch": 0.72, + "learning_rate": 1.469e-05, + "loss": 0.1812, + "step": 7350 + }, + { + "epoch": 0.72, + "learning_rate": 1.47e-05, + "loss": 0.188, + "step": 7355 + }, + { + "epoch": 0.72, + "learning_rate": 1.4710000000000001e-05, + "loss": 0.1571, + "step": 7360 + }, + { + "epoch": 0.72, + "learning_rate": 1.472e-05, + "loss": 0.1621, + "step": 7365 + }, + { + "epoch": 0.72, + "learning_rate": 1.473e-05, + "loss": 0.2059, + "step": 7370 + }, + { + "epoch": 0.72, + "learning_rate": 1.4740000000000001e-05, + "loss": 0.1556, + "step": 7375 + }, + { + "epoch": 0.72, + "learning_rate": 1.475e-05, + "loss": 0.1597, + "step": 7380 + }, + { + "epoch": 0.72, + "learning_rate": 1.4760000000000001e-05, + "loss": 0.2018, + "step": 7385 + }, + { + "epoch": 0.72, + "learning_rate": 1.4770000000000001e-05, + "loss": 0.1629, + "step": 7390 + }, + { + "epoch": 0.72, + "learning_rate": 1.4779999999999999e-05, + "loss": 0.1513, + "step": 7395 + }, + { + "epoch": 0.72, + "learning_rate": 1.479e-05, + "loss": 0.1879, + "step": 7400 + }, + { + "epoch": 0.72, + "learning_rate": 1.48e-05, + "loss": 0.1956, + "step": 7405 + }, + { + "epoch": 0.72, + "learning_rate": 1.4809999999999999e-05, + "loss": 0.1599, + "step": 7410 + }, + { + "epoch": 0.73, + "learning_rate": 1.482e-05, + "loss": 0.1697, + "step": 7415 + }, + { + "epoch": 0.73, + "learning_rate": 1.483e-05, + "loss": 0.2155, + "step": 7420 + }, + { + "epoch": 0.73, + "learning_rate": 1.484e-05, + "loss": 0.1566, + "step": 7425 + }, + { + "epoch": 0.73, + "learning_rate": 1.485e-05, + "loss": 0.1653, + "step": 7430 + }, + { + "epoch": 0.73, + "learning_rate": 1.486e-05, + "loss": 0.1996, + "step": 7435 + }, + { + "epoch": 0.73, + "learning_rate": 1.487e-05, + "loss": 0.1787, + "step": 7440 + }, + { + "epoch": 0.73, + "learning_rate": 1.488e-05, + "loss": 0.1672, + "step": 7445 + }, + { + "epoch": 0.73, + "learning_rate": 1.4890000000000001e-05, + "loss": 0.1901, + "step": 7450 + }, + { + "epoch": 0.73, + "learning_rate": 1.49e-05, + "loss": 0.1633, + "step": 7455 + }, + { + "epoch": 0.73, + "learning_rate": 1.491e-05, + "loss": 0.1586, + "step": 7460 + }, + { + "epoch": 0.73, + "learning_rate": 1.4920000000000001e-05, + "loss": 0.1792, + "step": 7465 + }, + { + "epoch": 0.73, + "learning_rate": 1.493e-05, + "loss": 0.1892, + "step": 7470 + }, + { + "epoch": 0.73, + "learning_rate": 1.4940000000000001e-05, + "loss": 0.1685, + "step": 7475 + }, + { + "epoch": 0.73, + "learning_rate": 1.4950000000000001e-05, + "loss": 0.1603, + "step": 7480 + }, + { + "epoch": 0.73, + "learning_rate": 1.4959999999999999e-05, + "loss": 0.1988, + "step": 7485 + }, + { + "epoch": 0.73, + "learning_rate": 1.497e-05, + "loss": 0.151, + "step": 7490 + }, + { + "epoch": 0.73, + "learning_rate": 1.498e-05, + "loss": 0.1419, + "step": 7495 + }, + { + "epoch": 0.73, + "learning_rate": 1.499e-05, + "loss": 0.1723, + "step": 7500 + }, + { + "epoch": 0.73, + "eval_cer": 0.06731780859294612, + "eval_loss": 0.30364254117012024, + "eval_runtime": 277.1356, + "eval_samples_per_second": 59.069, + "eval_steps_per_second": 1.642, + "eval_wer": 0.17582912702506806, + "step": 7500 + }, + { + "epoch": 0.73, + "learning_rate": 1.5e-05, + "loss": 0.1843, + "step": 7505 + }, + { + "epoch": 0.73, + "learning_rate": 1.5009999999999999e-05, + "loss": 0.1708, + "step": 7510 + }, + { + "epoch": 0.73, + "learning_rate": 1.5020000000000002e-05, + "loss": 0.1837, + "step": 7515 + }, + { + "epoch": 0.74, + "learning_rate": 1.503e-05, + "loss": 0.2127, + "step": 7520 + }, + { + "epoch": 0.74, + "learning_rate": 1.504e-05, + "loss": 0.1788, + "step": 7525 + }, + { + "epoch": 0.74, + "learning_rate": 1.5050000000000002e-05, + "loss": 0.1672, + "step": 7530 + }, + { + "epoch": 0.74, + "learning_rate": 1.506e-05, + "loss": 0.1786, + "step": 7535 + }, + { + "epoch": 0.74, + "learning_rate": 1.507e-05, + "loss": 0.1742, + "step": 7540 + }, + { + "epoch": 0.74, + "learning_rate": 1.5080000000000001e-05, + "loss": 0.1619, + "step": 7545 + }, + { + "epoch": 0.74, + "learning_rate": 1.5090000000000001e-05, + "loss": 0.1692, + "step": 7550 + }, + { + "epoch": 0.74, + "learning_rate": 1.51e-05, + "loss": 0.1695, + "step": 7555 + }, + { + "epoch": 0.74, + "learning_rate": 1.5110000000000001e-05, + "loss": 0.138, + "step": 7560 + }, + { + "epoch": 0.74, + "learning_rate": 1.5120000000000001e-05, + "loss": 0.1572, + "step": 7565 + }, + { + "epoch": 0.74, + "learning_rate": 1.5129999999999999e-05, + "loss": 0.1905, + "step": 7570 + }, + { + "epoch": 0.74, + "learning_rate": 1.5140000000000002e-05, + "loss": 0.1594, + "step": 7575 + }, + { + "epoch": 0.74, + "learning_rate": 1.515e-05, + "loss": 0.1521, + "step": 7580 + }, + { + "epoch": 0.74, + "learning_rate": 1.5159999999999999e-05, + "loss": 0.194, + "step": 7585 + }, + { + "epoch": 0.74, + "learning_rate": 1.5170000000000002e-05, + "loss": 0.1587, + "step": 7590 + }, + { + "epoch": 0.74, + "learning_rate": 1.518e-05, + "loss": 0.1578, + "step": 7595 + }, + { + "epoch": 0.74, + "learning_rate": 1.519e-05, + "loss": 0.1844, + "step": 7600 + }, + { + "epoch": 0.74, + "learning_rate": 1.5200000000000002e-05, + "loss": 0.158, + "step": 7605 + }, + { + "epoch": 0.74, + "learning_rate": 1.521e-05, + "loss": 0.1572, + "step": 7610 + }, + { + "epoch": 0.74, + "learning_rate": 1.522e-05, + "loss": 0.1826, + "step": 7615 + }, + { + "epoch": 0.75, + "learning_rate": 1.5230000000000002e-05, + "loss": 0.2139, + "step": 7620 + }, + { + "epoch": 0.75, + "learning_rate": 1.524e-05, + "loss": 0.1652, + "step": 7625 + }, + { + "epoch": 0.75, + "learning_rate": 1.525e-05, + "loss": 0.1685, + "step": 7630 + }, + { + "epoch": 0.75, + "learning_rate": 1.5260000000000003e-05, + "loss": 0.1955, + "step": 7635 + }, + { + "epoch": 0.75, + "learning_rate": 1.527e-05, + "loss": 0.1521, + "step": 7640 + }, + { + "epoch": 0.75, + "learning_rate": 1.528e-05, + "loss": 0.1601, + "step": 7645 + }, + { + "epoch": 0.75, + "learning_rate": 1.529e-05, + "loss": 0.1736, + "step": 7650 + }, + { + "epoch": 0.75, + "learning_rate": 1.53e-05, + "loss": 0.1884, + "step": 7655 + }, + { + "epoch": 0.75, + "learning_rate": 1.531e-05, + "loss": 0.1723, + "step": 7660 + }, + { + "epoch": 0.75, + "learning_rate": 1.5320000000000002e-05, + "loss": 0.1688, + "step": 7665 + }, + { + "epoch": 0.75, + "learning_rate": 1.533e-05, + "loss": 0.2092, + "step": 7670 + }, + { + "epoch": 0.75, + "learning_rate": 1.534e-05, + "loss": 0.1519, + "step": 7675 + }, + { + "epoch": 0.75, + "learning_rate": 1.535e-05, + "loss": 0.161, + "step": 7680 + }, + { + "epoch": 0.75, + "learning_rate": 1.5360000000000002e-05, + "loss": 0.192, + "step": 7685 + }, + { + "epoch": 0.75, + "learning_rate": 1.537e-05, + "loss": 0.1735, + "step": 7690 + }, + { + "epoch": 0.75, + "learning_rate": 1.5380000000000002e-05, + "loss": 0.1551, + "step": 7695 + }, + { + "epoch": 0.75, + "learning_rate": 1.539e-05, + "loss": 0.178, + "step": 7700 + }, + { + "epoch": 0.75, + "learning_rate": 1.5399999999999998e-05, + "loss": 0.1938, + "step": 7705 + }, + { + "epoch": 0.75, + "learning_rate": 1.5410000000000003e-05, + "loss": 0.1589, + "step": 7710 + }, + { + "epoch": 0.75, + "learning_rate": 1.542e-05, + "loss": 0.1613, + "step": 7715 + }, + { + "epoch": 0.75, + "learning_rate": 1.543e-05, + "loss": 0.194, + "step": 7720 + }, + { + "epoch": 0.76, + "learning_rate": 1.544e-05, + "loss": 0.1776, + "step": 7725 + }, + { + "epoch": 0.76, + "learning_rate": 1.545e-05, + "loss": 0.1761, + "step": 7730 + }, + { + "epoch": 0.76, + "learning_rate": 1.546e-05, + "loss": 0.1712, + "step": 7735 + }, + { + "epoch": 0.76, + "learning_rate": 1.5470000000000003e-05, + "loss": 0.1504, + "step": 7740 + }, + { + "epoch": 0.76, + "learning_rate": 1.548e-05, + "loss": 0.1625, + "step": 7745 + }, + { + "epoch": 0.76, + "learning_rate": 1.549e-05, + "loss": 0.1922, + "step": 7750 + }, + { + "epoch": 0.76, + "learning_rate": 1.55e-05, + "loss": 0.1796, + "step": 7755 + }, + { + "epoch": 0.76, + "learning_rate": 1.5510000000000002e-05, + "loss": 0.1605, + "step": 7760 + }, + { + "epoch": 0.76, + "learning_rate": 1.552e-05, + "loss": 0.158, + "step": 7765 + }, + { + "epoch": 0.76, + "learning_rate": 1.5530000000000002e-05, + "loss": 0.1863, + "step": 7770 + }, + { + "epoch": 0.76, + "learning_rate": 1.554e-05, + "loss": 0.1522, + "step": 7775 + }, + { + "epoch": 0.76, + "learning_rate": 1.555e-05, + "loss": 0.1777, + "step": 7780 + }, + { + "epoch": 0.76, + "learning_rate": 1.5560000000000003e-05, + "loss": 0.1964, + "step": 7785 + }, + { + "epoch": 0.76, + "learning_rate": 1.5570000000000002e-05, + "loss": 0.1456, + "step": 7790 + }, + { + "epoch": 0.76, + "learning_rate": 1.558e-05, + "loss": 0.1626, + "step": 7795 + }, + { + "epoch": 0.76, + "learning_rate": 1.559e-05, + "loss": 0.185, + "step": 7800 + }, + { + "epoch": 0.76, + "learning_rate": 1.56e-05, + "loss": 0.2009, + "step": 7805 + }, + { + "epoch": 0.76, + "learning_rate": 1.561e-05, + "loss": 0.1597, + "step": 7810 + }, + { + "epoch": 0.76, + "learning_rate": 1.5620000000000003e-05, + "loss": 0.1644, + "step": 7815 + }, + { + "epoch": 0.76, + "learning_rate": 1.563e-05, + "loss": 0.1907, + "step": 7820 + }, + { + "epoch": 0.77, + "learning_rate": 1.564e-05, + "loss": 0.1613, + "step": 7825 + }, + { + "epoch": 0.77, + "learning_rate": 1.5649999999999998e-05, + "loss": 0.1612, + "step": 7830 + }, + { + "epoch": 0.77, + "learning_rate": 1.5660000000000003e-05, + "loss": 0.1874, + "step": 7835 + }, + { + "epoch": 0.77, + "learning_rate": 1.567e-05, + "loss": 0.1697, + "step": 7840 + }, + { + "epoch": 0.77, + "learning_rate": 1.568e-05, + "loss": 0.1529, + "step": 7845 + }, + { + "epoch": 0.77, + "learning_rate": 1.569e-05, + "loss": 0.1637, + "step": 7850 + }, + { + "epoch": 0.77, + "learning_rate": 1.57e-05, + "loss": 0.1785, + "step": 7855 + }, + { + "epoch": 0.77, + "learning_rate": 1.571e-05, + "loss": 0.1386, + "step": 7860 + }, + { + "epoch": 0.77, + "learning_rate": 1.5720000000000002e-05, + "loss": 0.1782, + "step": 7865 + }, + { + "epoch": 0.77, + "learning_rate": 1.573e-05, + "loss": 0.2023, + "step": 7870 + }, + { + "epoch": 0.77, + "learning_rate": 1.574e-05, + "loss": 0.1503, + "step": 7875 + }, + { + "epoch": 0.77, + "learning_rate": 1.575e-05, + "loss": 0.1745, + "step": 7880 + }, + { + "epoch": 0.77, + "learning_rate": 1.576e-05, + "loss": 0.1968, + "step": 7885 + }, + { + "epoch": 0.77, + "learning_rate": 1.577e-05, + "loss": 0.1921, + "step": 7890 + }, + { + "epoch": 0.77, + "learning_rate": 1.578e-05, + "loss": 0.1512, + "step": 7895 + }, + { + "epoch": 0.77, + "learning_rate": 1.579e-05, + "loss": 0.1919, + "step": 7900 + }, + { + "epoch": 0.77, + "learning_rate": 1.5799999999999998e-05, + "loss": 0.2117, + "step": 7905 + }, + { + "epoch": 0.77, + "learning_rate": 1.5810000000000003e-05, + "loss": 0.1676, + "step": 7910 + }, + { + "epoch": 0.77, + "learning_rate": 1.582e-05, + "loss": 0.1575, + "step": 7915 + }, + { + "epoch": 0.77, + "learning_rate": 1.583e-05, + "loss": 0.1885, + "step": 7920 + }, + { + "epoch": 0.77, + "learning_rate": 1.584e-05, + "loss": 0.1646, + "step": 7925 + }, + { + "epoch": 0.78, + "learning_rate": 1.585e-05, + "loss": 0.1719, + "step": 7930 + }, + { + "epoch": 0.78, + "learning_rate": 1.586e-05, + "loss": 0.1751, + "step": 7935 + }, + { + "epoch": 0.78, + "learning_rate": 1.5870000000000002e-05, + "loss": 0.1866, + "step": 7940 + }, + { + "epoch": 0.78, + "learning_rate": 1.588e-05, + "loss": 0.1487, + "step": 7945 + }, + { + "epoch": 0.78, + "learning_rate": 1.589e-05, + "loss": 0.1657, + "step": 7950 + }, + { + "epoch": 0.78, + "learning_rate": 1.59e-05, + "loss": 0.1807, + "step": 7955 + }, + { + "epoch": 0.78, + "learning_rate": 1.591e-05, + "loss": 0.1597, + "step": 7960 + }, + { + "epoch": 0.78, + "learning_rate": 1.592e-05, + "loss": 0.1792, + "step": 7965 + }, + { + "epoch": 0.78, + "learning_rate": 1.593e-05, + "loss": 0.2125, + "step": 7970 + }, + { + "epoch": 0.78, + "learning_rate": 1.594e-05, + "loss": 0.1434, + "step": 7975 + }, + { + "epoch": 0.78, + "learning_rate": 1.5949999999999998e-05, + "loss": 0.1566, + "step": 7980 + }, + { + "epoch": 0.78, + "learning_rate": 1.596e-05, + "loss": 0.1887, + "step": 7985 + }, + { + "epoch": 0.78, + "learning_rate": 1.597e-05, + "loss": 0.1866, + "step": 7990 + }, + { + "epoch": 0.78, + "learning_rate": 1.598e-05, + "loss": 0.1675, + "step": 7995 + }, + { + "epoch": 0.78, + "learning_rate": 1.599e-05, + "loss": 0.1688, + "step": 8000 + }, + { + "epoch": 0.78, + "eval_cer": 0.06702183499009182, + "eval_loss": 0.29900655150413513, + "eval_runtime": 275.044, + "eval_samples_per_second": 59.518, + "eval_steps_per_second": 1.654, + "eval_wer": 0.17492800846267867, + "step": 8000 + }, + { + "epoch": 0.78, + "learning_rate": 1.6e-05, + "loss": 0.1694, + "step": 8005 + }, + { + "epoch": 0.78, + "learning_rate": 1.6009999999999997e-05, + "loss": 0.1384, + "step": 8010 + }, + { + "epoch": 0.78, + "learning_rate": 1.6020000000000002e-05, + "loss": 0.168, + "step": 8015 + }, + { + "epoch": 0.78, + "learning_rate": 1.603e-05, + "loss": 0.1852, + "step": 8020 + }, + { + "epoch": 0.78, + "learning_rate": 1.604e-05, + "loss": 0.1649, + "step": 8025 + }, + { + "epoch": 0.79, + "learning_rate": 1.605e-05, + "loss": 0.1475, + "step": 8030 + }, + { + "epoch": 0.79, + "learning_rate": 1.606e-05, + "loss": 0.1906, + "step": 8035 + }, + { + "epoch": 0.79, + "learning_rate": 1.607e-05, + "loss": 0.1608, + "step": 8040 + }, + { + "epoch": 0.79, + "learning_rate": 1.6080000000000002e-05, + "loss": 0.1497, + "step": 8045 + }, + { + "epoch": 0.79, + "learning_rate": 1.609e-05, + "loss": 0.1914, + "step": 8050 + }, + { + "epoch": 0.79, + "learning_rate": 1.61e-05, + "loss": 0.1599, + "step": 8055 + }, + { + "epoch": 0.79, + "learning_rate": 1.611e-05, + "loss": 0.1667, + "step": 8060 + }, + { + "epoch": 0.79, + "learning_rate": 1.612e-05, + "loss": 0.1694, + "step": 8065 + }, + { + "epoch": 0.79, + "learning_rate": 1.613e-05, + "loss": 0.1921, + "step": 8070 + }, + { + "epoch": 0.79, + "learning_rate": 1.614e-05, + "loss": 0.1495, + "step": 8075 + }, + { + "epoch": 0.79, + "learning_rate": 1.615e-05, + "loss": 0.1478, + "step": 8080 + }, + { + "epoch": 0.79, + "learning_rate": 1.6159999999999998e-05, + "loss": 0.1986, + "step": 8085 + }, + { + "epoch": 0.79, + "learning_rate": 1.6170000000000003e-05, + "loss": 0.1561, + "step": 8090 + }, + { + "epoch": 0.79, + "learning_rate": 1.618e-05, + "loss": 0.1484, + "step": 8095 + }, + { + "epoch": 0.79, + "learning_rate": 1.619e-05, + "loss": 0.1757, + "step": 8100 + }, + { + "epoch": 0.79, + "learning_rate": 1.62e-05, + "loss": 0.1833, + "step": 8105 + }, + { + "epoch": 0.79, + "learning_rate": 1.621e-05, + "loss": 0.1512, + "step": 8110 + }, + { + "epoch": 0.79, + "learning_rate": 1.622e-05, + "loss": 0.1632, + "step": 8115 + }, + { + "epoch": 0.79, + "learning_rate": 1.6230000000000002e-05, + "loss": 0.1841, + "step": 8120 + }, + { + "epoch": 0.79, + "learning_rate": 1.624e-05, + "loss": 0.1642, + "step": 8125 + }, + { + "epoch": 0.79, + "learning_rate": 1.625e-05, + "loss": 0.1418, + "step": 8130 + }, + { + "epoch": 0.8, + "learning_rate": 1.626e-05, + "loss": 0.1783, + "step": 8135 + }, + { + "epoch": 0.8, + "learning_rate": 1.6270000000000002e-05, + "loss": 0.1709, + "step": 8140 + }, + { + "epoch": 0.8, + "learning_rate": 1.628e-05, + "loss": 0.1556, + "step": 8145 + }, + { + "epoch": 0.8, + "learning_rate": 1.629e-05, + "loss": 0.1755, + "step": 8150 + }, + { + "epoch": 0.8, + "learning_rate": 1.63e-05, + "loss": 0.1783, + "step": 8155 + }, + { + "epoch": 0.8, + "learning_rate": 1.6309999999999998e-05, + "loss": 0.1773, + "step": 8160 + }, + { + "epoch": 0.8, + "learning_rate": 1.6320000000000003e-05, + "loss": 0.16, + "step": 8165 + }, + { + "epoch": 0.8, + "learning_rate": 1.633e-05, + "loss": 0.1953, + "step": 8170 + }, + { + "epoch": 0.8, + "learning_rate": 1.634e-05, + "loss": 0.1566, + "step": 8175 + }, + { + "epoch": 0.8, + "learning_rate": 1.635e-05, + "loss": 0.1383, + "step": 8180 + }, + { + "epoch": 0.8, + "learning_rate": 1.636e-05, + "loss": 0.2004, + "step": 8185 + }, + { + "epoch": 0.8, + "learning_rate": 1.637e-05, + "loss": 0.1514, + "step": 8190 + }, + { + "epoch": 0.8, + "learning_rate": 1.6380000000000002e-05, + "loss": 0.1867, + "step": 8195 + }, + { + "epoch": 0.8, + "learning_rate": 1.639e-05, + "loss": 0.2072, + "step": 8200 + }, + { + "epoch": 0.8, + "learning_rate": 1.64e-05, + "loss": 0.1962, + "step": 8205 + }, + { + "epoch": 0.8, + "learning_rate": 1.641e-05, + "loss": 0.156, + "step": 8210 + }, + { + "epoch": 0.8, + "learning_rate": 1.6420000000000002e-05, + "loss": 0.1601, + "step": 8215 + }, + { + "epoch": 0.8, + "learning_rate": 1.643e-05, + "loss": 0.1731, + "step": 8220 + }, + { + "epoch": 0.8, + "learning_rate": 1.6440000000000002e-05, + "loss": 0.1534, + "step": 8225 + }, + { + "epoch": 0.8, + "learning_rate": 1.645e-05, + "loss": 0.1591, + "step": 8230 + }, + { + "epoch": 0.81, + "learning_rate": 1.6459999999999998e-05, + "loss": 0.1833, + "step": 8235 + }, + { + "epoch": 0.81, + "learning_rate": 1.6470000000000003e-05, + "loss": 0.1853, + "step": 8240 + }, + { + "epoch": 0.81, + "learning_rate": 1.648e-05, + "loss": 0.165, + "step": 8245 + }, + { + "epoch": 0.81, + "learning_rate": 1.649e-05, + "loss": 0.1779, + "step": 8250 + }, + { + "epoch": 0.81, + "learning_rate": 1.65e-05, + "loss": 0.1957, + "step": 8255 + }, + { + "epoch": 0.81, + "learning_rate": 1.651e-05, + "loss": 0.1649, + "step": 8260 + }, + { + "epoch": 0.81, + "learning_rate": 1.652e-05, + "loss": 0.1729, + "step": 8265 + }, + { + "epoch": 0.81, + "learning_rate": 1.6530000000000003e-05, + "loss": 0.1846, + "step": 8270 + }, + { + "epoch": 0.81, + "learning_rate": 1.654e-05, + "loss": 0.1634, + "step": 8275 + }, + { + "epoch": 0.81, + "learning_rate": 1.655e-05, + "loss": 0.1551, + "step": 8280 + }, + { + "epoch": 0.81, + "learning_rate": 1.656e-05, + "loss": 0.1921, + "step": 8285 + }, + { + "epoch": 0.81, + "learning_rate": 1.6570000000000002e-05, + "loss": 0.1794, + "step": 8290 + }, + { + "epoch": 0.81, + "learning_rate": 1.658e-05, + "loss": 0.1539, + "step": 8295 + }, + { + "epoch": 0.81, + "learning_rate": 1.6590000000000002e-05, + "loss": 0.1816, + "step": 8300 + }, + { + "epoch": 0.81, + "learning_rate": 1.66e-05, + "loss": 0.184, + "step": 8305 + }, + { + "epoch": 0.81, + "learning_rate": 1.661e-05, + "loss": 0.1667, + "step": 8310 + }, + { + "epoch": 0.81, + "learning_rate": 1.6620000000000004e-05, + "loss": 0.1627, + "step": 8315 + }, + { + "epoch": 0.81, + "learning_rate": 1.6630000000000002e-05, + "loss": 0.2055, + "step": 8320 + }, + { + "epoch": 0.81, + "learning_rate": 1.664e-05, + "loss": 0.171, + "step": 8325 + }, + { + "epoch": 0.81, + "learning_rate": 1.665e-05, + "loss": 0.1481, + "step": 8330 + }, + { + "epoch": 0.82, + "learning_rate": 1.666e-05, + "loss": 0.2108, + "step": 8335 + }, + { + "epoch": 0.82, + "learning_rate": 1.667e-05, + "loss": 0.1637, + "step": 8340 + }, + { + "epoch": 0.82, + "learning_rate": 1.6680000000000003e-05, + "loss": 0.1681, + "step": 8345 + }, + { + "epoch": 0.82, + "learning_rate": 1.669e-05, + "loss": 0.1721, + "step": 8350 + }, + { + "epoch": 0.82, + "learning_rate": 1.67e-05, + "loss": 0.1722, + "step": 8355 + }, + { + "epoch": 0.82, + "learning_rate": 1.671e-05, + "loss": 0.1515, + "step": 8360 + }, + { + "epoch": 0.82, + "learning_rate": 1.672e-05, + "loss": 0.1904, + "step": 8365 + }, + { + "epoch": 0.82, + "learning_rate": 1.673e-05, + "loss": 0.1965, + "step": 8370 + }, + { + "epoch": 0.82, + "learning_rate": 1.6740000000000002e-05, + "loss": 0.1546, + "step": 8375 + }, + { + "epoch": 0.82, + "learning_rate": 1.675e-05, + "loss": 0.15, + "step": 8380 + }, + { + "epoch": 0.82, + "learning_rate": 1.676e-05, + "loss": 0.1888, + "step": 8385 + }, + { + "epoch": 0.82, + "learning_rate": 1.677e-05, + "loss": 0.1522, + "step": 8390 + }, + { + "epoch": 0.82, + "learning_rate": 1.6780000000000002e-05, + "loss": 0.1498, + "step": 8395 + }, + { + "epoch": 0.82, + "learning_rate": 1.679e-05, + "loss": 0.1862, + "step": 8400 + }, + { + "epoch": 0.82, + "learning_rate": 1.6800000000000002e-05, + "loss": 0.1986, + "step": 8405 + }, + { + "epoch": 0.82, + "learning_rate": 1.681e-05, + "loss": 0.1658, + "step": 8410 + }, + { + "epoch": 0.82, + "learning_rate": 1.6819999999999998e-05, + "loss": 0.1541, + "step": 8415 + }, + { + "epoch": 0.82, + "learning_rate": 1.6830000000000003e-05, + "loss": 0.1975, + "step": 8420 + }, + { + "epoch": 0.82, + "learning_rate": 1.684e-05, + "loss": 0.1435, + "step": 8425 + }, + { + "epoch": 0.82, + "learning_rate": 1.685e-05, + "loss": 0.1376, + "step": 8430 + }, + { + "epoch": 0.82, + "learning_rate": 1.686e-05, + "loss": 0.2128, + "step": 8435 + }, + { + "epoch": 0.83, + "learning_rate": 1.687e-05, + "loss": 0.1742, + "step": 8440 + }, + { + "epoch": 0.83, + "learning_rate": 1.688e-05, + "loss": 0.1605, + "step": 8445 + }, + { + "epoch": 0.83, + "learning_rate": 1.689e-05, + "loss": 0.1901, + "step": 8450 + }, + { + "epoch": 0.83, + "learning_rate": 1.69e-05, + "loss": 0.1672, + "step": 8455 + }, + { + "epoch": 0.83, + "learning_rate": 1.691e-05, + "loss": 0.1576, + "step": 8460 + }, + { + "epoch": 0.83, + "learning_rate": 1.6919999999999997e-05, + "loss": 0.1978, + "step": 8465 + }, + { + "epoch": 0.83, + "learning_rate": 1.6930000000000002e-05, + "loss": 0.2051, + "step": 8470 + }, + { + "epoch": 0.83, + "learning_rate": 1.694e-05, + "loss": 0.1681, + "step": 8475 + }, + { + "epoch": 0.83, + "learning_rate": 1.695e-05, + "loss": 0.1441, + "step": 8480 + }, + { + "epoch": 0.83, + "learning_rate": 1.696e-05, + "loss": 0.1789, + "step": 8485 + }, + { + "epoch": 0.83, + "learning_rate": 1.697e-05, + "loss": 0.155, + "step": 8490 + }, + { + "epoch": 0.83, + "learning_rate": 1.698e-05, + "loss": 0.1603, + "step": 8495 + }, + { + "epoch": 0.83, + "learning_rate": 1.699e-05, + "loss": 0.1776, + "step": 8500 + }, + { + "epoch": 0.83, + "eval_cer": 0.06634202062103586, + "eval_loss": 0.2983554005622864, + "eval_runtime": 274.8616, + "eval_samples_per_second": 59.557, + "eval_steps_per_second": 1.655, + "eval_wer": 0.17419013601666417, + "step": 8500 + }, + { + "epoch": 0.83, + "learning_rate": 1.7e-05, + "loss": 0.1777, + "step": 8505 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009999999999998e-05, + "loss": 0.1602, + "step": 8510 + }, + { + "epoch": 0.83, + "learning_rate": 1.702e-05, + "loss": 0.1964, + "step": 8515 + }, + { + "epoch": 0.83, + "learning_rate": 1.703e-05, + "loss": 0.1919, + "step": 8520 + }, + { + "epoch": 0.83, + "learning_rate": 1.704e-05, + "loss": 0.159, + "step": 8525 + }, + { + "epoch": 0.83, + "learning_rate": 1.705e-05, + "loss": 0.1685, + "step": 8530 + }, + { + "epoch": 0.83, + "learning_rate": 1.706e-05, + "loss": 0.167, + "step": 8535 + }, + { + "epoch": 0.84, + "learning_rate": 1.7069999999999998e-05, + "loss": 0.1736, + "step": 8540 + }, + { + "epoch": 0.84, + "learning_rate": 1.7080000000000002e-05, + "loss": 0.1462, + "step": 8545 + }, + { + "epoch": 0.84, + "learning_rate": 1.709e-05, + "loss": 0.1918, + "step": 8550 + }, + { + "epoch": 0.84, + "learning_rate": 1.71e-05, + "loss": 0.2091, + "step": 8555 + }, + { + "epoch": 0.84, + "learning_rate": 1.711e-05, + "loss": 0.1494, + "step": 8560 + }, + { + "epoch": 0.84, + "learning_rate": 1.712e-05, + "loss": 0.1634, + "step": 8565 + }, + { + "epoch": 0.84, + "learning_rate": 1.713e-05, + "loss": 0.1647, + "step": 8570 + }, + { + "epoch": 0.84, + "learning_rate": 1.7140000000000002e-05, + "loss": 0.1746, + "step": 8575 + }, + { + "epoch": 0.84, + "learning_rate": 1.715e-05, + "loss": 0.1539, + "step": 8580 + }, + { + "epoch": 0.84, + "learning_rate": 1.716e-05, + "loss": 0.1872, + "step": 8585 + }, + { + "epoch": 0.84, + "learning_rate": 1.717e-05, + "loss": 0.1763, + "step": 8590 + }, + { + "epoch": 0.84, + "learning_rate": 1.718e-05, + "loss": 0.1519, + "step": 8595 + }, + { + "epoch": 0.84, + "learning_rate": 1.719e-05, + "loss": 0.2006, + "step": 8600 + }, + { + "epoch": 0.84, + "learning_rate": 1.72e-05, + "loss": 0.1742, + "step": 8605 + }, + { + "epoch": 0.84, + "learning_rate": 1.721e-05, + "loss": 0.1623, + "step": 8610 + }, + { + "epoch": 0.84, + "learning_rate": 1.7219999999999998e-05, + "loss": 0.1644, + "step": 8615 + }, + { + "epoch": 0.84, + "learning_rate": 1.7230000000000003e-05, + "loss": 0.2063, + "step": 8620 + }, + { + "epoch": 0.84, + "learning_rate": 1.724e-05, + "loss": 0.1566, + "step": 8625 + }, + { + "epoch": 0.84, + "learning_rate": 1.725e-05, + "loss": 0.1802, + "step": 8630 + }, + { + "epoch": 0.84, + "learning_rate": 1.726e-05, + "loss": 0.2086, + "step": 8635 + }, + { + "epoch": 0.84, + "learning_rate": 1.727e-05, + "loss": 0.1659, + "step": 8640 + }, + { + "epoch": 0.85, + "learning_rate": 1.728e-05, + "loss": 0.1551, + "step": 8645 + }, + { + "epoch": 0.85, + "learning_rate": 1.7290000000000002e-05, + "loss": 0.1877, + "step": 8650 + }, + { + "epoch": 0.85, + "learning_rate": 1.73e-05, + "loss": 0.1815, + "step": 8655 + }, + { + "epoch": 0.85, + "learning_rate": 1.731e-05, + "loss": 0.1599, + "step": 8660 + }, + { + "epoch": 0.85, + "learning_rate": 1.732e-05, + "loss": 0.1593, + "step": 8665 + }, + { + "epoch": 0.85, + "learning_rate": 1.7330000000000002e-05, + "loss": 0.1852, + "step": 8670 + }, + { + "epoch": 0.85, + "learning_rate": 1.734e-05, + "loss": 0.1572, + "step": 8675 + }, + { + "epoch": 0.85, + "learning_rate": 1.735e-05, + "loss": 0.1566, + "step": 8680 + }, + { + "epoch": 0.85, + "learning_rate": 1.736e-05, + "loss": 0.186, + "step": 8685 + }, + { + "epoch": 0.85, + "learning_rate": 1.7369999999999998e-05, + "loss": 0.1764, + "step": 8690 + }, + { + "epoch": 0.85, + "learning_rate": 1.7380000000000003e-05, + "loss": 0.1531, + "step": 8695 + }, + { + "epoch": 0.85, + "learning_rate": 1.739e-05, + "loss": 0.1553, + "step": 8700 + }, + { + "epoch": 0.85, + "learning_rate": 1.74e-05, + "loss": 0.1999, + "step": 8705 + }, + { + "epoch": 0.85, + "learning_rate": 1.741e-05, + "loss": 0.1321, + "step": 8710 + }, + { + "epoch": 0.85, + "learning_rate": 1.742e-05, + "loss": 0.1733, + "step": 8715 + }, + { + "epoch": 0.85, + "learning_rate": 1.743e-05, + "loss": 0.1838, + "step": 8720 + }, + { + "epoch": 0.85, + "learning_rate": 1.7440000000000002e-05, + "loss": 0.159, + "step": 8725 + }, + { + "epoch": 0.85, + "learning_rate": 1.745e-05, + "loss": 0.1681, + "step": 8730 + }, + { + "epoch": 0.85, + "learning_rate": 1.746e-05, + "loss": 0.2065, + "step": 8735 + }, + { + "epoch": 0.85, + "learning_rate": 1.747e-05, + "loss": 0.161, + "step": 8740 + }, + { + "epoch": 0.86, + "learning_rate": 1.7480000000000002e-05, + "loss": 0.152, + "step": 8745 + }, + { + "epoch": 0.86, + "learning_rate": 1.749e-05, + "loss": 0.1665, + "step": 8750 + }, + { + "epoch": 0.86, + "learning_rate": 1.7500000000000002e-05, + "loss": 0.1782, + "step": 8755 + }, + { + "epoch": 0.86, + "learning_rate": 1.751e-05, + "loss": 0.1498, + "step": 8760 + }, + { + "epoch": 0.86, + "learning_rate": 1.7519999999999998e-05, + "loss": 0.1792, + "step": 8765 + }, + { + "epoch": 0.86, + "learning_rate": 1.7530000000000003e-05, + "loss": 0.1979, + "step": 8770 + }, + { + "epoch": 0.86, + "learning_rate": 1.754e-05, + "loss": 0.1684, + "step": 8775 + }, + { + "epoch": 0.86, + "learning_rate": 1.755e-05, + "loss": 0.161, + "step": 8780 + }, + { + "epoch": 0.86, + "learning_rate": 1.756e-05, + "loss": 0.1809, + "step": 8785 + }, + { + "epoch": 0.86, + "learning_rate": 1.757e-05, + "loss": 0.1516, + "step": 8790 + }, + { + "epoch": 0.86, + "learning_rate": 1.758e-05, + "loss": 0.1739, + "step": 8795 + }, + { + "epoch": 0.86, + "learning_rate": 1.7590000000000003e-05, + "loss": 0.1652, + "step": 8800 + }, + { + "epoch": 0.86, + "learning_rate": 1.76e-05, + "loss": 0.1877, + "step": 8805 + }, + { + "epoch": 0.86, + "learning_rate": 1.761e-05, + "loss": 0.1776, + "step": 8810 + }, + { + "epoch": 0.86, + "learning_rate": 1.762e-05, + "loss": 0.1654, + "step": 8815 + }, + { + "epoch": 0.86, + "learning_rate": 1.763e-05, + "loss": 0.1811, + "step": 8820 + }, + { + "epoch": 0.86, + "learning_rate": 1.764e-05, + "loss": 0.1562, + "step": 8825 + }, + { + "epoch": 0.86, + "learning_rate": 1.7650000000000002e-05, + "loss": 0.173, + "step": 8830 + }, + { + "epoch": 0.86, + "learning_rate": 1.766e-05, + "loss": 0.1912, + "step": 8835 + }, + { + "epoch": 0.86, + "learning_rate": 1.767e-05, + "loss": 0.1647, + "step": 8840 + }, + { + "epoch": 0.86, + "learning_rate": 1.768e-05, + "loss": 0.1522, + "step": 8845 + }, + { + "epoch": 0.87, + "learning_rate": 1.7690000000000002e-05, + "loss": 0.1992, + "step": 8850 + }, + { + "epoch": 0.87, + "learning_rate": 1.77e-05, + "loss": 0.1975, + "step": 8855 + }, + { + "epoch": 0.87, + "learning_rate": 1.771e-05, + "loss": 0.1667, + "step": 8860 + }, + { + "epoch": 0.87, + "learning_rate": 1.772e-05, + "loss": 0.1604, + "step": 8865 + }, + { + "epoch": 0.87, + "learning_rate": 1.7728e-05, + "loss": 0.2078, + "step": 8870 + }, + { + "epoch": 0.87, + "learning_rate": 1.7738000000000002e-05, + "loss": 0.1605, + "step": 8875 + }, + { + "epoch": 0.87, + "learning_rate": 1.7748e-05, + "loss": 0.1809, + "step": 8880 + }, + { + "epoch": 0.87, + "learning_rate": 1.7758e-05, + "loss": 0.2118, + "step": 8885 + }, + { + "epoch": 0.87, + "learning_rate": 1.7768000000000003e-05, + "loss": 0.1843, + "step": 8890 + }, + { + "epoch": 0.87, + "learning_rate": 1.7778e-05, + "loss": 0.151, + "step": 8895 + }, + { + "epoch": 0.87, + "learning_rate": 1.7788e-05, + "loss": 0.1815, + "step": 8900 + }, + { + "epoch": 0.87, + "learning_rate": 1.7798e-05, + "loss": 0.1899, + "step": 8905 + }, + { + "epoch": 0.87, + "learning_rate": 1.7808e-05, + "loss": 0.1533, + "step": 8910 + }, + { + "epoch": 0.87, + "learning_rate": 1.7818e-05, + "loss": 0.1637, + "step": 8915 + }, + { + "epoch": 0.87, + "learning_rate": 1.7828000000000003e-05, + "loss": 0.1882, + "step": 8920 + }, + { + "epoch": 0.87, + "learning_rate": 1.7838e-05, + "loss": 0.1421, + "step": 8925 + }, + { + "epoch": 0.87, + "learning_rate": 1.7848e-05, + "loss": 0.1341, + "step": 8930 + }, + { + "epoch": 0.87, + "learning_rate": 1.7858e-05, + "loss": 0.1885, + "step": 8935 + }, + { + "epoch": 0.87, + "learning_rate": 1.7868000000000002e-05, + "loss": 0.1407, + "step": 8940 + }, + { + "epoch": 0.87, + "learning_rate": 1.7878e-05, + "loss": 0.1543, + "step": 8945 + }, + { + "epoch": 0.88, + "learning_rate": 1.7888e-05, + "loss": 0.1651, + "step": 8950 + }, + { + "epoch": 0.88, + "learning_rate": 1.7898e-05, + "loss": 0.1662, + "step": 8955 + }, + { + "epoch": 0.88, + "learning_rate": 1.7908e-05, + "loss": 0.15, + "step": 8960 + }, + { + "epoch": 0.88, + "learning_rate": 1.7918e-05, + "loss": 0.1604, + "step": 8965 + }, + { + "epoch": 0.88, + "learning_rate": 1.7928000000000002e-05, + "loss": 0.1779, + "step": 8970 + }, + { + "epoch": 0.88, + "learning_rate": 1.7938e-05, + "loss": 0.1454, + "step": 8975 + }, + { + "epoch": 0.88, + "learning_rate": 1.7947999999999998e-05, + "loss": 0.1351, + "step": 8980 + }, + { + "epoch": 0.88, + "learning_rate": 1.7958e-05, + "loss": 0.1695, + "step": 8985 + }, + { + "epoch": 0.88, + "learning_rate": 1.7968e-05, + "loss": 0.1615, + "step": 8990 + }, + { + "epoch": 0.88, + "learning_rate": 1.7978e-05, + "loss": 0.1415, + "step": 8995 + }, + { + "epoch": 0.88, + "learning_rate": 1.7986e-05, + "loss": 0.151, + "step": 9000 + }, + { + "epoch": 0.88, + "eval_cer": 0.065091069690222, + "eval_loss": 0.30274277925491333, + "eval_runtime": 276.1668, + "eval_samples_per_second": 59.276, + "eval_steps_per_second": 1.648, + "eval_wer": 0.1706640199029665, + "step": 9000 + }, + { + "epoch": 0.88, + "learning_rate": 1.7996000000000002e-05, + "loss": 0.1805, + "step": 9005 + }, + { + "epoch": 0.88, + "learning_rate": 1.8006e-05, + "loss": 0.1394, + "step": 9010 + }, + { + "epoch": 0.88, + "learning_rate": 1.8016e-05, + "loss": 0.1663, + "step": 9015 + }, + { + "epoch": 0.88, + "learning_rate": 1.8026e-05, + "loss": 0.1932, + "step": 9020 + }, + { + "epoch": 0.88, + "learning_rate": 1.8035999999999998e-05, + "loss": 0.1572, + "step": 9025 + }, + { + "epoch": 0.88, + "learning_rate": 1.8046000000000003e-05, + "loss": 0.1675, + "step": 9030 + }, + { + "epoch": 0.88, + "learning_rate": 1.8056e-05, + "loss": 0.1848, + "step": 9035 + }, + { + "epoch": 0.88, + "learning_rate": 1.8066e-05, + "loss": 0.1544, + "step": 9040 + }, + { + "epoch": 0.88, + "learning_rate": 1.8076e-05, + "loss": 0.1529, + "step": 9045 + }, + { + "epoch": 0.88, + "learning_rate": 1.8086e-05, + "loss": 0.1607, + "step": 9050 + }, + { + "epoch": 0.89, + "learning_rate": 1.8096e-05, + "loss": 0.1787, + "step": 9055 + }, + { + "epoch": 0.89, + "learning_rate": 1.8106000000000002e-05, + "loss": 0.1563, + "step": 9060 + }, + { + "epoch": 0.89, + "learning_rate": 1.8116e-05, + "loss": 0.1807, + "step": 9065 + }, + { + "epoch": 0.89, + "learning_rate": 1.8126e-05, + "loss": 0.1752, + "step": 9070 + }, + { + "epoch": 0.89, + "learning_rate": 1.8136e-05, + "loss": 0.1536, + "step": 9075 + }, + { + "epoch": 0.89, + "learning_rate": 1.8146e-05, + "loss": 0.1565, + "step": 9080 + }, + { + "epoch": 0.89, + "learning_rate": 1.8156e-05, + "loss": 0.194, + "step": 9085 + }, + { + "epoch": 0.89, + "learning_rate": 1.8166000000000002e-05, + "loss": 0.1546, + "step": 9090 + }, + { + "epoch": 0.89, + "learning_rate": 1.8176e-05, + "loss": 0.168, + "step": 9095 + }, + { + "epoch": 0.89, + "learning_rate": 1.8186e-05, + "loss": 0.1581, + "step": 9100 + }, + { + "epoch": 0.89, + "learning_rate": 1.8196e-05, + "loss": 0.1843, + "step": 9105 + }, + { + "epoch": 0.89, + "learning_rate": 1.8206e-05, + "loss": 0.1483, + "step": 9110 + }, + { + "epoch": 0.89, + "learning_rate": 1.8216e-05, + "loss": 0.1655, + "step": 9115 + }, + { + "epoch": 0.89, + "learning_rate": 1.8226e-05, + "loss": 0.2082, + "step": 9120 + }, + { + "epoch": 0.89, + "learning_rate": 1.8236e-05, + "loss": 0.1498, + "step": 9125 + }, + { + "epoch": 0.89, + "learning_rate": 1.8245999999999998e-05, + "loss": 0.1662, + "step": 9130 + }, + { + "epoch": 0.89, + "learning_rate": 1.8256000000000003e-05, + "loss": 0.1886, + "step": 9135 + }, + { + "epoch": 0.89, + "learning_rate": 1.8266e-05, + "loss": 0.1599, + "step": 9140 + }, + { + "epoch": 0.89, + "learning_rate": 1.8276e-05, + "loss": 0.153, + "step": 9145 + }, + { + "epoch": 0.89, + "learning_rate": 1.8286e-05, + "loss": 0.175, + "step": 9150 + }, + { + "epoch": 0.9, + "learning_rate": 1.8296e-05, + "loss": 0.1666, + "step": 9155 + }, + { + "epoch": 0.9, + "learning_rate": 1.8306e-05, + "loss": 0.1467, + "step": 9160 + }, + { + "epoch": 0.9, + "learning_rate": 1.8316000000000002e-05, + "loss": 0.1637, + "step": 9165 + }, + { + "epoch": 0.9, + "learning_rate": 1.8326e-05, + "loss": 0.1956, + "step": 9170 + }, + { + "epoch": 0.9, + "learning_rate": 1.8336e-05, + "loss": 0.1628, + "step": 9175 + }, + { + "epoch": 0.9, + "learning_rate": 1.8346e-05, + "loss": 0.1482, + "step": 9180 + }, + { + "epoch": 0.9, + "learning_rate": 1.8356000000000002e-05, + "loss": 0.1751, + "step": 9185 + }, + { + "epoch": 0.9, + "learning_rate": 1.8366e-05, + "loss": 0.1589, + "step": 9190 + }, + { + "epoch": 0.9, + "learning_rate": 1.8376e-05, + "loss": 0.1469, + "step": 9195 + }, + { + "epoch": 0.9, + "learning_rate": 1.8386e-05, + "loss": 0.1856, + "step": 9200 + }, + { + "epoch": 0.9, + "learning_rate": 1.8395999999999998e-05, + "loss": 0.1696, + "step": 9205 + }, + { + "epoch": 0.9, + "learning_rate": 1.8406000000000003e-05, + "loss": 0.1576, + "step": 9210 + }, + { + "epoch": 0.9, + "learning_rate": 1.8416e-05, + "loss": 0.1762, + "step": 9215 + }, + { + "epoch": 0.9, + "learning_rate": 1.8426e-05, + "loss": 0.1864, + "step": 9220 + }, + { + "epoch": 0.9, + "learning_rate": 1.8436e-05, + "loss": 0.1554, + "step": 9225 + }, + { + "epoch": 0.9, + "learning_rate": 1.8446e-05, + "loss": 0.1521, + "step": 9230 + }, + { + "epoch": 0.9, + "learning_rate": 1.8456e-05, + "loss": 0.2108, + "step": 9235 + }, + { + "epoch": 0.9, + "learning_rate": 1.8466000000000002e-05, + "loss": 0.1479, + "step": 9240 + }, + { + "epoch": 0.9, + "learning_rate": 1.8476e-05, + "loss": 0.1618, + "step": 9245 + }, + { + "epoch": 0.9, + "learning_rate": 1.8486e-05, + "loss": 0.1685, + "step": 9250 + }, + { + "epoch": 0.9, + "learning_rate": 1.8496e-05, + "loss": 0.163, + "step": 9255 + }, + { + "epoch": 0.91, + "learning_rate": 1.8506000000000002e-05, + "loss": 0.1416, + "step": 9260 + }, + { + "epoch": 0.91, + "learning_rate": 1.8516e-05, + "loss": 0.1737, + "step": 9265 + }, + { + "epoch": 0.91, + "learning_rate": 1.8526000000000002e-05, + "loss": 0.2091, + "step": 9270 + }, + { + "epoch": 0.91, + "learning_rate": 1.8536e-05, + "loss": 0.1614, + "step": 9275 + }, + { + "epoch": 0.91, + "learning_rate": 1.8545999999999998e-05, + "loss": 0.1496, + "step": 9280 + }, + { + "epoch": 0.91, + "learning_rate": 1.8556000000000003e-05, + "loss": 0.1735, + "step": 9285 + }, + { + "epoch": 0.91, + "learning_rate": 1.8566e-05, + "loss": 0.1599, + "step": 9290 + }, + { + "epoch": 0.91, + "learning_rate": 1.8576e-05, + "loss": 0.1546, + "step": 9295 + }, + { + "epoch": 0.91, + "learning_rate": 1.8586e-05, + "loss": 0.1801, + "step": 9300 + }, + { + "epoch": 0.91, + "learning_rate": 1.8596e-05, + "loss": 0.1676, + "step": 9305 + }, + { + "epoch": 0.91, + "learning_rate": 1.8606e-05, + "loss": 0.1441, + "step": 9310 + }, + { + "epoch": 0.91, + "learning_rate": 1.8616000000000003e-05, + "loss": 0.1741, + "step": 9315 + }, + { + "epoch": 0.91, + "learning_rate": 1.8626e-05, + "loss": 0.1988, + "step": 9320 + }, + { + "epoch": 0.91, + "learning_rate": 1.8636e-05, + "loss": 0.1575, + "step": 9325 + }, + { + "epoch": 0.91, + "learning_rate": 1.8646e-05, + "loss": 0.1443, + "step": 9330 + }, + { + "epoch": 0.91, + "learning_rate": 1.8656000000000002e-05, + "loss": 0.199, + "step": 9335 + }, + { + "epoch": 0.91, + "learning_rate": 1.8666e-05, + "loss": 0.1651, + "step": 9340 + }, + { + "epoch": 0.91, + "learning_rate": 1.8676000000000002e-05, + "loss": 0.1624, + "step": 9345 + }, + { + "epoch": 0.91, + "learning_rate": 1.8686e-05, + "loss": 0.1716, + "step": 9350 + }, + { + "epoch": 0.91, + "learning_rate": 1.8696e-05, + "loss": 0.167, + "step": 9355 + }, + { + "epoch": 0.92, + "learning_rate": 1.8706000000000004e-05, + "loss": 0.1524, + "step": 9360 + }, + { + "epoch": 0.92, + "learning_rate": 1.8716000000000002e-05, + "loss": 0.1571, + "step": 9365 + }, + { + "epoch": 0.92, + "learning_rate": 1.8726e-05, + "loss": 0.1738, + "step": 9370 + }, + { + "epoch": 0.92, + "learning_rate": 1.8736e-05, + "loss": 0.1395, + "step": 9375 + }, + { + "epoch": 0.92, + "learning_rate": 1.8746e-05, + "loss": 0.1556, + "step": 9380 + }, + { + "epoch": 0.92, + "learning_rate": 1.8756e-05, + "loss": 0.1813, + "step": 9385 + }, + { + "epoch": 0.92, + "learning_rate": 1.8766000000000003e-05, + "loss": 0.1612, + "step": 9390 + }, + { + "epoch": 0.92, + "learning_rate": 1.8776e-05, + "loss": 0.1369, + "step": 9395 + }, + { + "epoch": 0.92, + "learning_rate": 1.8786e-05, + "loss": 0.2, + "step": 9400 + }, + { + "epoch": 0.92, + "learning_rate": 1.8796e-05, + "loss": 0.1688, + "step": 9405 + }, + { + "epoch": 0.92, + "learning_rate": 1.8806000000000003e-05, + "loss": 0.161, + "step": 9410 + }, + { + "epoch": 0.92, + "learning_rate": 1.8816e-05, + "loss": 0.195, + "step": 9415 + }, + { + "epoch": 0.92, + "learning_rate": 1.8826000000000002e-05, + "loss": 0.1834, + "step": 9420 + }, + { + "epoch": 0.92, + "learning_rate": 1.8836e-05, + "loss": 0.1676, + "step": 9425 + }, + { + "epoch": 0.92, + "learning_rate": 1.8846e-05, + "loss": 0.1501, + "step": 9430 + }, + { + "epoch": 0.92, + "learning_rate": 1.8856000000000004e-05, + "loss": 0.1998, + "step": 9435 + }, + { + "epoch": 0.92, + "learning_rate": 1.8866000000000002e-05, + "loss": 0.1754, + "step": 9440 + }, + { + "epoch": 0.92, + "learning_rate": 1.8876e-05, + "loss": 0.1461, + "step": 9445 + }, + { + "epoch": 0.92, + "learning_rate": 1.8886e-05, + "loss": 0.1728, + "step": 9450 + }, + { + "epoch": 0.92, + "learning_rate": 1.8896e-05, + "loss": 0.1689, + "step": 9455 + }, + { + "epoch": 0.93, + "learning_rate": 1.8906e-05, + "loss": 0.161, + "step": 9460 + }, + { + "epoch": 0.93, + "learning_rate": 1.8916e-05, + "loss": 0.159, + "step": 9465 + }, + { + "epoch": 0.93, + "learning_rate": 1.8926e-05, + "loss": 0.1832, + "step": 9470 + }, + { + "epoch": 0.93, + "learning_rate": 1.8936e-05, + "loss": 0.1426, + "step": 9475 + }, + { + "epoch": 0.93, + "learning_rate": 1.8945999999999998e-05, + "loss": 0.1557, + "step": 9480 + }, + { + "epoch": 0.93, + "learning_rate": 1.8956e-05, + "loss": 0.1531, + "step": 9485 + }, + { + "epoch": 0.93, + "learning_rate": 1.8966e-05, + "loss": 0.1631, + "step": 9490 + }, + { + "epoch": 0.93, + "learning_rate": 1.8976e-05, + "loss": 0.1257, + "step": 9495 + }, + { + "epoch": 0.93, + "learning_rate": 1.8986e-05, + "loss": 0.1609, + "step": 9500 + }, + { + "epoch": 0.93, + "eval_cer": 0.06672470524035137, + "eval_loss": 0.3000984787940979, + "eval_runtime": 276.249, + "eval_samples_per_second": 59.258, + "eval_steps_per_second": 1.647, + "eval_wer": 0.17380487518201942, + "step": 9500 + }, + { + "epoch": 0.93, + "learning_rate": 1.8996e-05, + "loss": 0.1829, + "step": 9505 + }, + { + "epoch": 0.93, + "learning_rate": 1.9005999999999997e-05, + "loss": 0.1591, + "step": 9510 + }, + { + "epoch": 0.93, + "learning_rate": 1.9016000000000002e-05, + "loss": 0.1617, + "step": 9515 + }, + { + "epoch": 0.93, + "learning_rate": 1.9026e-05, + "loss": 0.1863, + "step": 9520 + }, + { + "epoch": 0.93, + "learning_rate": 1.9036e-05, + "loss": 0.1544, + "step": 9525 + }, + { + "epoch": 0.93, + "learning_rate": 1.9046e-05, + "loss": 0.1544, + "step": 9530 + }, + { + "epoch": 0.93, + "learning_rate": 1.9056e-05, + "loss": 0.2044, + "step": 9535 + }, + { + "epoch": 0.93, + "learning_rate": 1.9066e-05, + "loss": 0.1768, + "step": 9540 + }, + { + "epoch": 0.93, + "learning_rate": 1.9076e-05, + "loss": 0.1626, + "step": 9545 + }, + { + "epoch": 0.93, + "learning_rate": 1.9086e-05, + "loss": 0.1526, + "step": 9550 + }, + { + "epoch": 0.93, + "learning_rate": 1.9095999999999998e-05, + "loss": 0.1741, + "step": 9555 + }, + { + "epoch": 0.93, + "learning_rate": 1.9106e-05, + "loss": 0.1548, + "step": 9560 + }, + { + "epoch": 0.94, + "learning_rate": 1.9116e-05, + "loss": 0.1639, + "step": 9565 + }, + { + "epoch": 0.94, + "learning_rate": 1.9126e-05, + "loss": 0.1874, + "step": 9570 + }, + { + "epoch": 0.94, + "learning_rate": 1.9136e-05, + "loss": 0.141, + "step": 9575 + }, + { + "epoch": 0.94, + "learning_rate": 1.9146e-05, + "loss": 0.1503, + "step": 9580 + }, + { + "epoch": 0.94, + "learning_rate": 1.9155999999999998e-05, + "loss": 0.215, + "step": 9585 + }, + { + "epoch": 0.94, + "learning_rate": 1.9166000000000003e-05, + "loss": 0.1674, + "step": 9590 + }, + { + "epoch": 0.94, + "learning_rate": 1.9176e-05, + "loss": 0.1492, + "step": 9595 + }, + { + "epoch": 0.94, + "learning_rate": 1.9186e-05, + "loss": 0.1767, + "step": 9600 + }, + { + "epoch": 0.94, + "learning_rate": 1.9196e-05, + "loss": 0.1629, + "step": 9605 + }, + { + "epoch": 0.94, + "learning_rate": 1.9206e-05, + "loss": 0.1544, + "step": 9610 + }, + { + "epoch": 0.94, + "learning_rate": 1.9216e-05, + "loss": 0.1561, + "step": 9615 + }, + { + "epoch": 0.94, + "learning_rate": 1.9226000000000002e-05, + "loss": 0.188, + "step": 9620 + }, + { + "epoch": 0.94, + "learning_rate": 1.9236e-05, + "loss": 0.149, + "step": 9625 + }, + { + "epoch": 0.94, + "learning_rate": 1.9246e-05, + "loss": 0.1573, + "step": 9630 + }, + { + "epoch": 0.94, + "learning_rate": 1.9256e-05, + "loss": 0.1791, + "step": 9635 + }, + { + "epoch": 0.94, + "learning_rate": 1.9266e-05, + "loss": 0.153, + "step": 9640 + }, + { + "epoch": 0.94, + "learning_rate": 1.9276e-05, + "loss": 0.1526, + "step": 9645 + }, + { + "epoch": 0.94, + "learning_rate": 1.9286e-05, + "loss": 0.1757, + "step": 9650 + }, + { + "epoch": 0.94, + "learning_rate": 1.9296e-05, + "loss": 0.1914, + "step": 9655 + }, + { + "epoch": 0.94, + "learning_rate": 1.9305999999999998e-05, + "loss": 0.1477, + "step": 9660 + }, + { + "epoch": 0.95, + "learning_rate": 1.9316000000000003e-05, + "loss": 0.1718, + "step": 9665 + }, + { + "epoch": 0.95, + "learning_rate": 1.9326e-05, + "loss": 0.2031, + "step": 9670 + }, + { + "epoch": 0.95, + "learning_rate": 1.9336e-05, + "loss": 0.1651, + "step": 9675 + }, + { + "epoch": 0.95, + "learning_rate": 1.9346e-05, + "loss": 0.1444, + "step": 9680 + }, + { + "epoch": 0.95, + "learning_rate": 1.9356e-05, + "loss": 0.185, + "step": 9685 + }, + { + "epoch": 0.95, + "learning_rate": 1.9366e-05, + "loss": 0.1578, + "step": 9690 + }, + { + "epoch": 0.95, + "learning_rate": 1.9376000000000002e-05, + "loss": 0.1647, + "step": 9695 + }, + { + "epoch": 0.95, + "learning_rate": 1.9386e-05, + "loss": 0.1722, + "step": 9700 + }, + { + "epoch": 0.95, + "learning_rate": 1.9396e-05, + "loss": 0.1868, + "step": 9705 + }, + { + "epoch": 0.95, + "learning_rate": 1.9406e-05, + "loss": 0.1791, + "step": 9710 + }, + { + "epoch": 0.95, + "learning_rate": 1.9416000000000002e-05, + "loss": 0.1427, + "step": 9715 + }, + { + "epoch": 0.95, + "learning_rate": 1.9426e-05, + "loss": 0.1986, + "step": 9720 + }, + { + "epoch": 0.95, + "learning_rate": 1.9436e-05, + "loss": 0.1506, + "step": 9725 + }, + { + "epoch": 0.95, + "learning_rate": 1.9446e-05, + "loss": 0.1474, + "step": 9730 + }, + { + "epoch": 0.95, + "learning_rate": 1.9455999999999998e-05, + "loss": 0.1916, + "step": 9735 + }, + { + "epoch": 0.95, + "learning_rate": 1.9466000000000003e-05, + "loss": 0.1365, + "step": 9740 + }, + { + "epoch": 0.95, + "learning_rate": 1.9476e-05, + "loss": 0.1557, + "step": 9745 + }, + { + "epoch": 0.95, + "learning_rate": 1.9486e-05, + "loss": 0.1662, + "step": 9750 + }, + { + "epoch": 0.95, + "learning_rate": 1.9496e-05, + "loss": 0.1862, + "step": 9755 + }, + { + "epoch": 0.95, + "learning_rate": 1.9506e-05, + "loss": 0.1469, + "step": 9760 + }, + { + "epoch": 0.95, + "learning_rate": 1.9516e-05, + "loss": 0.1418, + "step": 9765 + }, + { + "epoch": 0.96, + "learning_rate": 1.9526000000000002e-05, + "loss": 0.179, + "step": 9770 + }, + { + "epoch": 0.96, + "learning_rate": 1.9536e-05, + "loss": 0.1522, + "step": 9775 + }, + { + "epoch": 0.96, + "learning_rate": 1.9546e-05, + "loss": 0.1858, + "step": 9780 + }, + { + "epoch": 0.96, + "learning_rate": 1.9556e-05, + "loss": 0.183, + "step": 9785 + }, + { + "epoch": 0.96, + "learning_rate": 1.9566000000000002e-05, + "loss": 0.1652, + "step": 9790 + }, + { + "epoch": 0.96, + "learning_rate": 1.9576e-05, + "loss": 0.165, + "step": 9795 + }, + { + "epoch": 0.96, + "learning_rate": 1.9586000000000002e-05, + "loss": 0.1898, + "step": 9800 + }, + { + "epoch": 0.96, + "learning_rate": 1.9596e-05, + "loss": 0.1605, + "step": 9805 + }, + { + "epoch": 0.96, + "learning_rate": 1.9605999999999998e-05, + "loss": 0.1454, + "step": 9810 + }, + { + "epoch": 0.96, + "learning_rate": 1.9616000000000003e-05, + "loss": 0.1733, + "step": 9815 + }, + { + "epoch": 0.96, + "learning_rate": 1.9626e-05, + "loss": 0.2042, + "step": 9820 + }, + { + "epoch": 0.96, + "learning_rate": 1.9636e-05, + "loss": 0.1677, + "step": 9825 + }, + { + "epoch": 0.96, + "learning_rate": 1.9646e-05, + "loss": 0.1709, + "step": 9830 + }, + { + "epoch": 0.96, + "learning_rate": 1.9656e-05, + "loss": 0.1714, + "step": 9835 + }, + { + "epoch": 0.96, + "learning_rate": 1.9666e-05, + "loss": 0.1623, + "step": 9840 + }, + { + "epoch": 0.96, + "learning_rate": 1.9676000000000003e-05, + "loss": 0.1589, + "step": 9845 + }, + { + "epoch": 0.96, + "learning_rate": 1.9686e-05, + "loss": 0.1793, + "step": 9850 + }, + { + "epoch": 0.96, + "learning_rate": 1.9696e-05, + "loss": 0.1848, + "step": 9855 + }, + { + "epoch": 0.96, + "learning_rate": 1.9706e-05, + "loss": 0.1521, + "step": 9860 + }, + { + "epoch": 0.96, + "learning_rate": 1.9716000000000002e-05, + "loss": 0.1724, + "step": 9865 + }, + { + "epoch": 0.97, + "learning_rate": 1.9726e-05, + "loss": 0.1865, + "step": 9870 + }, + { + "epoch": 0.97, + "learning_rate": 1.9736000000000002e-05, + "loss": 0.1467, + "step": 9875 + }, + { + "epoch": 0.97, + "learning_rate": 1.9746e-05, + "loss": 0.1588, + "step": 9880 + }, + { + "epoch": 0.97, + "learning_rate": 1.9756e-05, + "loss": 0.1811, + "step": 9885 + }, + { + "epoch": 0.97, + "learning_rate": 1.9766000000000004e-05, + "loss": 0.1653, + "step": 9890 + }, + { + "epoch": 0.97, + "learning_rate": 1.9776000000000002e-05, + "loss": 0.1563, + "step": 9895 + }, + { + "epoch": 0.97, + "learning_rate": 1.9786e-05, + "loss": 0.1893, + "step": 9900 + }, + { + "epoch": 0.97, + "learning_rate": 1.9796e-05, + "loss": 0.1739, + "step": 9905 + }, + { + "epoch": 0.97, + "learning_rate": 1.9806e-05, + "loss": 0.1427, + "step": 9910 + }, + { + "epoch": 0.97, + "learning_rate": 1.9816e-05, + "loss": 0.1705, + "step": 9915 + }, + { + "epoch": 0.97, + "learning_rate": 1.9826000000000003e-05, + "loss": 0.2113, + "step": 9920 + }, + { + "epoch": 0.97, + "learning_rate": 1.9836e-05, + "loss": 0.1394, + "step": 9925 + }, + { + "epoch": 0.97, + "learning_rate": 1.9846e-05, + "loss": 0.1644, + "step": 9930 + }, + { + "epoch": 0.97, + "learning_rate": 1.9856e-05, + "loss": 0.1776, + "step": 9935 + }, + { + "epoch": 0.97, + "learning_rate": 1.9866e-05, + "loss": 0.1404, + "step": 9940 + }, + { + "epoch": 0.97, + "learning_rate": 1.9876e-05, + "loss": 0.1678, + "step": 9945 + }, + { + "epoch": 0.97, + "learning_rate": 1.9886000000000002e-05, + "loss": 0.1786, + "step": 9950 + }, + { + "epoch": 0.97, + "learning_rate": 1.9896e-05, + "loss": 0.1836, + "step": 9955 + }, + { + "epoch": 0.97, + "learning_rate": 1.9906e-05, + "loss": 0.1647, + "step": 9960 + }, + { + "epoch": 0.97, + "learning_rate": 1.9916e-05, + "loss": 0.1612, + "step": 9965 + }, + { + "epoch": 0.97, + "learning_rate": 1.9926000000000002e-05, + "loss": 0.1927, + "step": 9970 + }, + { + "epoch": 0.98, + "learning_rate": 1.9936e-05, + "loss": 0.1521, + "step": 9975 + }, + { + "epoch": 0.98, + "learning_rate": 1.9946000000000002e-05, + "loss": 0.1548, + "step": 9980 + }, + { + "epoch": 0.98, + "learning_rate": 1.9956e-05, + "loss": 0.1957, + "step": 9985 + }, + { + "epoch": 0.98, + "learning_rate": 1.9965999999999998e-05, + "loss": 0.1573, + "step": 9990 + }, + { + "epoch": 0.98, + "learning_rate": 1.9976000000000003e-05, + "loss": 0.1328, + "step": 9995 + }, + { + "epoch": 0.98, + "learning_rate": 1.9986e-05, + "loss": 0.1735, + "step": 10000 + }, + { + "epoch": 0.98, + "eval_cer": 0.06671198762460373, + "eval_loss": 0.30074480175971985, + "eval_runtime": 274.6835, + "eval_samples_per_second": 59.596, + "eval_steps_per_second": 1.656, + "eval_wer": 0.1747582325016488, + "step": 10000 + }, + { + "epoch": 0.98, + "learning_rate": 1.9996e-05, + "loss": 0.1789, + "step": 10005 + }, + { + "epoch": 0.98, + "learning_rate": 2.0006e-05, + "loss": 0.1481, + "step": 10010 + }, + { + "epoch": 0.98, + "learning_rate": 2.0016e-05, + "loss": 0.1537, + "step": 10015 + }, + { + "epoch": 0.98, + "learning_rate": 2.0026e-05, + "loss": 0.2072, + "step": 10020 + }, + { + "epoch": 0.98, + "learning_rate": 2.0036000000000003e-05, + "loss": 0.1534, + "step": 10025 + }, + { + "epoch": 0.98, + "learning_rate": 2.0046e-05, + "loss": 0.1594, + "step": 10030 + }, + { + "epoch": 0.98, + "learning_rate": 2.0056e-05, + "loss": 0.1954, + "step": 10035 + }, + { + "epoch": 0.98, + "learning_rate": 2.0066e-05, + "loss": 0.156, + "step": 10040 + }, + { + "epoch": 0.98, + "learning_rate": 2.0076000000000002e-05, + "loss": 0.1522, + "step": 10045 + }, + { + "epoch": 0.98, + "learning_rate": 2.0086e-05, + "loss": 0.1667, + "step": 10050 + }, + { + "epoch": 0.98, + "learning_rate": 2.0096000000000002e-05, + "loss": 0.1791, + "step": 10055 + }, + { + "epoch": 0.98, + "learning_rate": 2.0106e-05, + "loss": 0.1582, + "step": 10060 + }, + { + "epoch": 0.98, + "learning_rate": 2.0116e-05, + "loss": 0.1546, + "step": 10065 + }, + { + "epoch": 0.98, + "learning_rate": 2.0126e-05, + "loss": 0.1933, + "step": 10070 + }, + { + "epoch": 0.99, + "learning_rate": 2.0136e-05, + "loss": 0.1469, + "step": 10075 + }, + { + "epoch": 0.99, + "learning_rate": 2.0146e-05, + "loss": 0.1472, + "step": 10080 + }, + { + "epoch": 0.99, + "learning_rate": 2.0155999999999998e-05, + "loss": 0.2039, + "step": 10085 + }, + { + "epoch": 0.99, + "learning_rate": 2.0166e-05, + "loss": 0.1645, + "step": 10090 + }, + { + "epoch": 0.99, + "learning_rate": 2.0176e-05, + "loss": 0.1496, + "step": 10095 + }, + { + "epoch": 0.99, + "learning_rate": 2.0186e-05, + "loss": 0.156, + "step": 10100 + }, + { + "epoch": 0.99, + "learning_rate": 2.0196e-05, + "loss": 0.1715, + "step": 10105 + }, + { + "epoch": 0.99, + "learning_rate": 2.0206e-05, + "loss": 0.1577, + "step": 10110 + }, + { + "epoch": 0.99, + "learning_rate": 2.0215999999999998e-05, + "loss": 0.167, + "step": 10115 + }, + { + "epoch": 0.99, + "learning_rate": 2.0226000000000003e-05, + "loss": 0.1893, + "step": 10120 + }, + { + "epoch": 0.99, + "learning_rate": 2.0236e-05, + "loss": 0.157, + "step": 10125 + }, + { + "epoch": 0.99, + "learning_rate": 2.0246e-05, + "loss": 0.1618, + "step": 10130 + }, + { + "epoch": 0.99, + "learning_rate": 2.0256e-05, + "loss": 0.1833, + "step": 10135 + }, + { + "epoch": 0.99, + "learning_rate": 2.0266e-05, + "loss": 0.1622, + "step": 10140 + }, + { + "epoch": 0.99, + "learning_rate": 2.0276e-05, + "loss": 0.1559, + "step": 10145 + }, + { + "epoch": 0.99, + "learning_rate": 2.0286000000000002e-05, + "loss": 0.1697, + "step": 10150 + }, + { + "epoch": 0.99, + "learning_rate": 2.0296e-05, + "loss": 0.1722, + "step": 10155 + }, + { + "epoch": 0.99, + "learning_rate": 2.0306e-05, + "loss": 0.1475, + "step": 10160 + }, + { + "epoch": 0.99, + "learning_rate": 2.0316e-05, + "loss": 0.1483, + "step": 10165 + }, + { + "epoch": 0.99, + "learning_rate": 2.0326e-05, + "loss": 0.2273, + "step": 10170 + }, + { + "epoch": 0.99, + "learning_rate": 2.0336e-05, + "loss": 0.1717, + "step": 10175 + }, + { + "epoch": 1.0, + "learning_rate": 2.0346e-05, + "loss": 0.1674, + "step": 10180 + }, + { + "epoch": 1.0, + "learning_rate": 2.0356e-05, + "loss": 0.1707, + "step": 10185 + }, + { + "epoch": 1.0, + "learning_rate": 2.0365999999999998e-05, + "loss": 0.1894, + "step": 10190 + }, + { + "epoch": 1.0, + "learning_rate": 2.0376000000000003e-05, + "loss": 0.1565, + "step": 10195 + }, + { + "epoch": 1.0, + "learning_rate": 2.0386e-05, + "loss": 0.1896, + "step": 10200 + }, + { + "epoch": 1.0, + "learning_rate": 2.0396e-05, + "loss": 0.1753, + "step": 10205 + }, + { + "epoch": 1.0, + "learning_rate": 2.0406e-05, + "loss": 0.154, + "step": 10210 + }, + { + "epoch": 1.0, + "learning_rate": 2.0416e-05, + "loss": 0.1427, + "step": 10215 + }, + { + "epoch": 1.0, + "learning_rate": 2.0426e-05, + "loss": 0.1731, + "step": 10220 + }, + { + "epoch": 1.0, + "learning_rate": 2.0436000000000002e-05, + "loss": 0.1467, + "step": 10225 + }, + { + "epoch": 1.0, + "learning_rate": 2.0446e-05, + "loss": 0.1733, + "step": 10230 + }, + { + "epoch": 1.0, + "learning_rate": 2.0456e-05, + "loss": 0.1509, + "step": 10235 + }, + { + "epoch": 1.0, + "learning_rate": 2.0466e-05, + "loss": 0.1438, + "step": 10240 + }, + { + "epoch": 1.0, + "learning_rate": 2.0476000000000002e-05, + "loss": 0.1641, + "step": 10245 + }, + { + "epoch": 1.0, + "learning_rate": 2.0486e-05, + "loss": 0.1473, + "step": 10250 + }, + { + "epoch": 1.0, + "learning_rate": 2.0496e-05, + "loss": 0.1342, + "step": 10255 + }, + { + "epoch": 1.0, + "learning_rate": 2.0506e-05, + "loss": 0.1686, + "step": 10260 + }, + { + "epoch": 1.0, + "learning_rate": 2.0515999999999998e-05, + "loss": 0.1452, + "step": 10265 + }, + { + "epoch": 1.0, + "learning_rate": 2.0526000000000003e-05, + "loss": 0.156, + "step": 10270 + }, + { + "epoch": 1.0, + "learning_rate": 2.0536e-05, + "loss": 0.1717, + "step": 10275 + }, + { + "epoch": 1.01, + "learning_rate": 2.0546e-05, + "loss": 0.1793, + "step": 10280 + }, + { + "epoch": 1.01, + "learning_rate": 2.0556e-05, + "loss": 0.1399, + "step": 10285 + }, + { + "epoch": 1.01, + "learning_rate": 2.0566e-05, + "loss": 0.1551, + "step": 10290 + }, + { + "epoch": 1.01, + "learning_rate": 2.0576e-05, + "loss": 0.1699, + "step": 10295 + }, + { + "epoch": 1.01, + "learning_rate": 2.0586000000000002e-05, + "loss": 0.1493, + "step": 10300 + }, + { + "epoch": 1.01, + "learning_rate": 2.0596e-05, + "loss": 0.1598, + "step": 10305 + }, + { + "epoch": 1.01, + "learning_rate": 2.0606e-05, + "loss": 0.1531, + "step": 10310 + }, + { + "epoch": 1.01, + "learning_rate": 2.0616e-05, + "loss": 0.1631, + "step": 10315 + }, + { + "epoch": 1.01, + "learning_rate": 2.0626000000000002e-05, + "loss": 0.1466, + "step": 10320 + }, + { + "epoch": 1.01, + "learning_rate": 2.0636e-05, + "loss": 0.155, + "step": 10325 + }, + { + "epoch": 1.01, + "learning_rate": 2.0646000000000002e-05, + "loss": 0.1662, + "step": 10330 + }, + { + "epoch": 1.01, + "learning_rate": 2.0656e-05, + "loss": 0.137, + "step": 10335 + }, + { + "epoch": 1.01, + "learning_rate": 2.0666e-05, + "loss": 0.1801, + "step": 10340 + }, + { + "epoch": 1.01, + "learning_rate": 2.0676e-05, + "loss": 0.1841, + "step": 10345 + }, + { + "epoch": 1.01, + "learning_rate": 2.0686e-05, + "loss": 0.1447, + "step": 10350 + }, + { + "epoch": 1.01, + "learning_rate": 2.0696e-05, + "loss": 0.1567, + "step": 10355 + }, + { + "epoch": 1.01, + "learning_rate": 2.0706e-05, + "loss": 0.1613, + "step": 10360 + }, + { + "epoch": 1.01, + "learning_rate": 2.0716e-05, + "loss": 0.1582, + "step": 10365 + }, + { + "epoch": 1.01, + "learning_rate": 2.0725999999999998e-05, + "loss": 0.1449, + "step": 10370 + }, + { + "epoch": 1.01, + "learning_rate": 2.0736000000000003e-05, + "loss": 0.1474, + "step": 10375 + }, + { + "epoch": 1.01, + "learning_rate": 2.0746e-05, + "loss": 0.1948, + "step": 10380 + }, + { + "epoch": 1.02, + "learning_rate": 2.0756e-05, + "loss": 0.134, + "step": 10385 + }, + { + "epoch": 1.02, + "learning_rate": 2.0766e-05, + "loss": 0.1447, + "step": 10390 + }, + { + "epoch": 1.02, + "learning_rate": 2.0776e-05, + "loss": 0.1779, + "step": 10395 + }, + { + "epoch": 1.02, + "learning_rate": 2.0786e-05, + "loss": 0.1567, + "step": 10400 + }, + { + "epoch": 1.02, + "learning_rate": 2.0796000000000002e-05, + "loss": 0.1395, + "step": 10405 + }, + { + "epoch": 1.02, + "learning_rate": 2.0806e-05, + "loss": 0.1868, + "step": 10410 + }, + { + "epoch": 1.02, + "learning_rate": 2.0816e-05, + "loss": 0.1859, + "step": 10415 + }, + { + "epoch": 1.02, + "learning_rate": 2.0826e-05, + "loss": 0.1433, + "step": 10420 + }, + { + "epoch": 1.02, + "learning_rate": 2.0836000000000002e-05, + "loss": 0.1166, + "step": 10425 + }, + { + "epoch": 1.02, + "learning_rate": 2.0846e-05, + "loss": 0.177, + "step": 10430 + }, + { + "epoch": 1.02, + "learning_rate": 2.0856e-05, + "loss": 0.1521, + "step": 10435 + }, + { + "epoch": 1.02, + "learning_rate": 2.0866e-05, + "loss": 0.1433, + "step": 10440 + }, + { + "epoch": 1.02, + "learning_rate": 2.0875999999999998e-05, + "loss": 0.1886, + "step": 10445 + }, + { + "epoch": 1.02, + "learning_rate": 2.0886000000000003e-05, + "loss": 0.1412, + "step": 10450 + }, + { + "epoch": 1.02, + "learning_rate": 2.0896e-05, + "loss": 0.1291, + "step": 10455 + }, + { + "epoch": 1.02, + "learning_rate": 2.0906e-05, + "loss": 0.1726, + "step": 10460 + }, + { + "epoch": 1.02, + "learning_rate": 2.0916e-05, + "loss": 0.1621, + "step": 10465 + }, + { + "epoch": 1.02, + "learning_rate": 2.0926e-05, + "loss": 0.1461, + "step": 10470 + }, + { + "epoch": 1.02, + "learning_rate": 2.0936e-05, + "loss": 0.1531, + "step": 10475 + }, + { + "epoch": 1.02, + "learning_rate": 2.0946000000000002e-05, + "loss": 0.1755, + "step": 10480 + }, + { + "epoch": 1.03, + "learning_rate": 2.0956e-05, + "loss": 0.1397, + "step": 10485 + }, + { + "epoch": 1.03, + "learning_rate": 2.0966e-05, + "loss": 0.1494, + "step": 10490 + }, + { + "epoch": 1.03, + "learning_rate": 2.0976e-05, + "loss": 0.1854, + "step": 10495 + }, + { + "epoch": 1.03, + "learning_rate": 2.0986000000000002e-05, + "loss": 0.1355, + "step": 10500 + }, + { + "epoch": 1.03, + "eval_cer": 0.06653047256347824, + "eval_loss": 0.29528552293777466, + "eval_runtime": 269.6155, + "eval_samples_per_second": 60.716, + "eval_steps_per_second": 1.688, + "eval_wer": 0.17161737722259587, + "step": 10500 + }, + { + "epoch": 1.03, + "learning_rate": 2.0996e-05, + "loss": 0.1467, + "step": 10505 + }, + { + "epoch": 1.03, + "learning_rate": 2.1006000000000002e-05, + "loss": 0.1547, + "step": 10510 + }, + { + "epoch": 1.03, + "learning_rate": 2.1016e-05, + "loss": 0.173, + "step": 10515 + }, + { + "epoch": 1.03, + "learning_rate": 2.1025999999999998e-05, + "loss": 0.1408, + "step": 10520 + }, + { + "epoch": 1.03, + "learning_rate": 2.1036000000000003e-05, + "loss": 0.1541, + "step": 10525 + }, + { + "epoch": 1.03, + "learning_rate": 2.1046e-05, + "loss": 0.1902, + "step": 10530 + }, + { + "epoch": 1.03, + "learning_rate": 2.1056e-05, + "loss": 0.1478, + "step": 10535 + }, + { + "epoch": 1.03, + "learning_rate": 2.1066e-05, + "loss": 0.1509, + "step": 10540 + }, + { + "epoch": 1.03, + "learning_rate": 2.1076e-05, + "loss": 0.1836, + "step": 10545 + }, + { + "epoch": 1.03, + "learning_rate": 2.1086e-05, + "loss": 0.1494, + "step": 10550 + }, + { + "epoch": 1.03, + "learning_rate": 2.1096000000000003e-05, + "loss": 0.1367, + "step": 10555 + }, + { + "epoch": 1.03, + "learning_rate": 2.1106e-05, + "loss": 0.1565, + "step": 10560 + }, + { + "epoch": 1.03, + "learning_rate": 2.1116e-05, + "loss": 0.1784, + "step": 10565 + }, + { + "epoch": 1.03, + "learning_rate": 2.1126e-05, + "loss": 0.141, + "step": 10570 + }, + { + "epoch": 1.03, + "learning_rate": 2.1136000000000002e-05, + "loss": 0.1328, + "step": 10575 + }, + { + "epoch": 1.03, + "learning_rate": 2.1146e-05, + "loss": 0.1857, + "step": 10580 + }, + { + "epoch": 1.04, + "learning_rate": 2.1156000000000002e-05, + "loss": 0.1435, + "step": 10585 + }, + { + "epoch": 1.04, + "learning_rate": 2.1166e-05, + "loss": 0.1484, + "step": 10590 + }, + { + "epoch": 1.04, + "learning_rate": 2.1176e-05, + "loss": 0.1821, + "step": 10595 + }, + { + "epoch": 1.04, + "learning_rate": 2.1186000000000003e-05, + "loss": 0.1508, + "step": 10600 + }, + { + "epoch": 1.04, + "learning_rate": 2.1196000000000002e-05, + "loss": 0.1447, + "step": 10605 + }, + { + "epoch": 1.04, + "learning_rate": 2.1206e-05, + "loss": 0.1438, + "step": 10610 + }, + { + "epoch": 1.04, + "learning_rate": 2.1216e-05, + "loss": 0.1901, + "step": 10615 + }, + { + "epoch": 1.04, + "learning_rate": 2.1226e-05, + "loss": 0.1414, + "step": 10620 + }, + { + "epoch": 1.04, + "learning_rate": 2.1236e-05, + "loss": 0.1503, + "step": 10625 + }, + { + "epoch": 1.04, + "learning_rate": 2.1246000000000003e-05, + "loss": 0.1781, + "step": 10630 + }, + { + "epoch": 1.04, + "learning_rate": 2.1256e-05, + "loss": 0.1453, + "step": 10635 + }, + { + "epoch": 1.04, + "learning_rate": 2.1266e-05, + "loss": 0.1494, + "step": 10640 + }, + { + "epoch": 1.04, + "learning_rate": 2.1276e-05, + "loss": 0.1946, + "step": 10645 + }, + { + "epoch": 1.04, + "learning_rate": 2.1286000000000003e-05, + "loss": 0.1492, + "step": 10650 + }, + { + "epoch": 1.04, + "learning_rate": 2.1296e-05, + "loss": 0.1503, + "step": 10655 + }, + { + "epoch": 1.04, + "learning_rate": 2.1306000000000002e-05, + "loss": 0.1951, + "step": 10660 + }, + { + "epoch": 1.04, + "learning_rate": 2.1316e-05, + "loss": 0.1881, + "step": 10665 + }, + { + "epoch": 1.04, + "learning_rate": 2.1326e-05, + "loss": 0.1491, + "step": 10670 + }, + { + "epoch": 1.04, + "learning_rate": 2.1336000000000004e-05, + "loss": 0.1964, + "step": 10675 + }, + { + "epoch": 1.04, + "learning_rate": 2.1346000000000002e-05, + "loss": 0.1723, + "step": 10680 + }, + { + "epoch": 1.04, + "learning_rate": 2.1356e-05, + "loss": 0.1688, + "step": 10685 + }, + { + "epoch": 1.05, + "learning_rate": 2.1366000000000002e-05, + "loss": 0.1405, + "step": 10690 + }, + { + "epoch": 1.05, + "learning_rate": 2.1376e-05, + "loss": 0.1532, + "step": 10695 + }, + { + "epoch": 1.05, + "learning_rate": 2.1386e-05, + "loss": 0.1496, + "step": 10700 + }, + { + "epoch": 1.05, + "learning_rate": 2.1396e-05, + "loss": 0.1383, + "step": 10705 + }, + { + "epoch": 1.05, + "learning_rate": 2.1406e-05, + "loss": 0.1653, + "step": 10710 + }, + { + "epoch": 1.05, + "learning_rate": 2.1416e-05, + "loss": 0.1664, + "step": 10715 + }, + { + "epoch": 1.05, + "learning_rate": 2.1425999999999998e-05, + "loss": 0.1363, + "step": 10720 + }, + { + "epoch": 1.05, + "learning_rate": 2.1436000000000003e-05, + "loss": 0.1623, + "step": 10725 + }, + { + "epoch": 1.05, + "learning_rate": 2.1446e-05, + "loss": 0.1734, + "step": 10730 + }, + { + "epoch": 1.05, + "learning_rate": 2.1456e-05, + "loss": 0.1439, + "step": 10735 + }, + { + "epoch": 1.05, + "learning_rate": 2.1466e-05, + "loss": 0.1381, + "step": 10740 + }, + { + "epoch": 1.05, + "learning_rate": 2.1476e-05, + "loss": 0.1995, + "step": 10745 + }, + { + "epoch": 1.05, + "learning_rate": 2.1486e-05, + "loss": 0.1384, + "step": 10750 + }, + { + "epoch": 1.05, + "learning_rate": 2.1496000000000002e-05, + "loss": 0.1434, + "step": 10755 + }, + { + "epoch": 1.05, + "learning_rate": 2.1506e-05, + "loss": 0.1565, + "step": 10760 + }, + { + "epoch": 1.05, + "learning_rate": 2.1516e-05, + "loss": 0.1668, + "step": 10765 + }, + { + "epoch": 1.05, + "learning_rate": 2.1526e-05, + "loss": 0.1354, + "step": 10770 + }, + { + "epoch": 1.05, + "learning_rate": 2.1536e-05, + "loss": 0.1327, + "step": 10775 + }, + { + "epoch": 1.05, + "learning_rate": 2.1546e-05, + "loss": 0.1763, + "step": 10780 + }, + { + "epoch": 1.05, + "learning_rate": 2.1556e-05, + "loss": 0.1584, + "step": 10785 + }, + { + "epoch": 1.06, + "learning_rate": 2.1566e-05, + "loss": 0.1507, + "step": 10790 + }, + { + "epoch": 1.06, + "learning_rate": 2.1575999999999998e-05, + "loss": 0.1859, + "step": 10795 + }, + { + "epoch": 1.06, + "learning_rate": 2.1586e-05, + "loss": 0.1509, + "step": 10800 + }, + { + "epoch": 1.06, + "learning_rate": 2.1596e-05, + "loss": 0.1488, + "step": 10805 + }, + { + "epoch": 1.06, + "learning_rate": 2.1606e-05, + "loss": 0.1747, + "step": 10810 + }, + { + "epoch": 1.06, + "learning_rate": 2.1616e-05, + "loss": 0.1773, + "step": 10815 + }, + { + "epoch": 1.06, + "learning_rate": 2.1626e-05, + "loss": 0.1375, + "step": 10820 + }, + { + "epoch": 1.06, + "learning_rate": 2.1635999999999997e-05, + "loss": 0.1519, + "step": 10825 + }, + { + "epoch": 1.06, + "learning_rate": 2.1646000000000002e-05, + "loss": 0.168, + "step": 10830 + }, + { + "epoch": 1.06, + "learning_rate": 2.1656e-05, + "loss": 0.1572, + "step": 10835 + }, + { + "epoch": 1.06, + "learning_rate": 2.1666e-05, + "loss": 0.1483, + "step": 10840 + }, + { + "epoch": 1.06, + "learning_rate": 2.1676e-05, + "loss": 0.1668, + "step": 10845 + }, + { + "epoch": 1.06, + "learning_rate": 2.1686e-05, + "loss": 0.1521, + "step": 10850 + }, + { + "epoch": 1.06, + "learning_rate": 2.1696e-05, + "loss": 0.1544, + "step": 10855 + }, + { + "epoch": 1.06, + "learning_rate": 2.1706000000000002e-05, + "loss": 0.1546, + "step": 10860 + }, + { + "epoch": 1.06, + "learning_rate": 2.1716e-05, + "loss": 0.1714, + "step": 10865 + }, + { + "epoch": 1.06, + "learning_rate": 2.1726e-05, + "loss": 0.1501, + "step": 10870 + }, + { + "epoch": 1.06, + "learning_rate": 2.1736e-05, + "loss": 0.1427, + "step": 10875 + }, + { + "epoch": 1.06, + "learning_rate": 2.1746e-05, + "loss": 0.1932, + "step": 10880 + }, + { + "epoch": 1.06, + "learning_rate": 2.1756e-05, + "loss": 0.1535, + "step": 10885 + }, + { + "epoch": 1.06, + "learning_rate": 2.1766e-05, + "loss": 0.1543, + "step": 10890 + }, + { + "epoch": 1.07, + "learning_rate": 2.1776e-05, + "loss": 0.1953, + "step": 10895 + }, + { + "epoch": 1.07, + "learning_rate": 2.1785999999999998e-05, + "loss": 0.1589, + "step": 10900 + }, + { + "epoch": 1.07, + "learning_rate": 2.1796000000000003e-05, + "loss": 0.1447, + "step": 10905 + }, + { + "epoch": 1.07, + "learning_rate": 2.1806e-05, + "loss": 0.1768, + "step": 10910 + }, + { + "epoch": 1.07, + "learning_rate": 2.1816e-05, + "loss": 0.1509, + "step": 10915 + }, + { + "epoch": 1.07, + "learning_rate": 2.1826e-05, + "loss": 0.143, + "step": 10920 + }, + { + "epoch": 1.07, + "learning_rate": 2.1836e-05, + "loss": 0.1603, + "step": 10925 + }, + { + "epoch": 1.07, + "learning_rate": 2.1846e-05, + "loss": 0.2045, + "step": 10930 + }, + { + "epoch": 1.07, + "learning_rate": 2.1856000000000002e-05, + "loss": 0.1434, + "step": 10935 + }, + { + "epoch": 1.07, + "learning_rate": 2.1866e-05, + "loss": 0.1428, + "step": 10940 + }, + { + "epoch": 1.07, + "learning_rate": 2.1876e-05, + "loss": 0.1939, + "step": 10945 + }, + { + "epoch": 1.07, + "learning_rate": 2.1886e-05, + "loss": 0.1701, + "step": 10950 + }, + { + "epoch": 1.07, + "learning_rate": 2.1896000000000002e-05, + "loss": 0.1447, + "step": 10955 + }, + { + "epoch": 1.07, + "learning_rate": 2.1906e-05, + "loss": 0.1622, + "step": 10960 + }, + { + "epoch": 1.07, + "learning_rate": 2.1916e-05, + "loss": 0.1824, + "step": 10965 + }, + { + "epoch": 1.07, + "learning_rate": 2.1926e-05, + "loss": 0.1549, + "step": 10970 + }, + { + "epoch": 1.07, + "learning_rate": 2.1935999999999998e-05, + "loss": 0.177, + "step": 10975 + }, + { + "epoch": 1.07, + "learning_rate": 2.1946000000000003e-05, + "loss": 0.2208, + "step": 10980 + }, + { + "epoch": 1.07, + "learning_rate": 2.1956e-05, + "loss": 0.1584, + "step": 10985 + }, + { + "epoch": 1.07, + "learning_rate": 2.1966e-05, + "loss": 0.1489, + "step": 10990 + }, + { + "epoch": 1.08, + "learning_rate": 2.1976e-05, + "loss": 0.1786, + "step": 10995 + }, + { + "epoch": 1.08, + "learning_rate": 2.1986e-05, + "loss": 0.1538, + "step": 11000 + }, + { + "epoch": 1.08, + "eval_cer": 0.06717907096660816, + "eval_loss": 0.28717195987701416, + "eval_runtime": 269.1324, + "eval_samples_per_second": 60.825, + "eval_steps_per_second": 1.691, + "eval_wer": 0.17326942792030978, + "step": 11000 + }, + { + "epoch": 1.08, + "learning_rate": 2.1996e-05, + "loss": 0.1408, + "step": 11005 + }, + { + "epoch": 1.08, + "learning_rate": 2.2006000000000002e-05, + "loss": 0.1635, + "step": 11010 + }, + { + "epoch": 1.08, + "learning_rate": 2.2016e-05, + "loss": 0.1589, + "step": 11015 + }, + { + "epoch": 1.08, + "learning_rate": 2.2026e-05, + "loss": 0.1457, + "step": 11020 + }, + { + "epoch": 1.08, + "learning_rate": 2.2036e-05, + "loss": 0.1528, + "step": 11025 + }, + { + "epoch": 1.08, + "learning_rate": 2.2046000000000002e-05, + "loss": 0.1818, + "step": 11030 + }, + { + "epoch": 1.08, + "learning_rate": 2.2056e-05, + "loss": 0.1467, + "step": 11035 + }, + { + "epoch": 1.08, + "learning_rate": 2.2066000000000002e-05, + "loss": 0.1485, + "step": 11040 + }, + { + "epoch": 1.08, + "learning_rate": 2.2076e-05, + "loss": 0.2049, + "step": 11045 + }, + { + "epoch": 1.08, + "learning_rate": 2.2085999999999998e-05, + "loss": 0.1556, + "step": 11050 + }, + { + "epoch": 1.08, + "learning_rate": 2.2096000000000003e-05, + "loss": 0.1541, + "step": 11055 + }, + { + "epoch": 1.08, + "learning_rate": 2.2106e-05, + "loss": 0.1675, + "step": 11060 + }, + { + "epoch": 1.08, + "learning_rate": 2.2116e-05, + "loss": 0.1672, + "step": 11065 + }, + { + "epoch": 1.08, + "learning_rate": 2.2126e-05, + "loss": 0.1598, + "step": 11070 + }, + { + "epoch": 1.08, + "learning_rate": 2.2136e-05, + "loss": 0.1591, + "step": 11075 + }, + { + "epoch": 1.08, + "learning_rate": 2.2146e-05, + "loss": 0.1873, + "step": 11080 + }, + { + "epoch": 1.08, + "learning_rate": 2.2156000000000003e-05, + "loss": 0.1569, + "step": 11085 + }, + { + "epoch": 1.08, + "learning_rate": 2.2166e-05, + "loss": 0.1408, + "step": 11090 + }, + { + "epoch": 1.08, + "learning_rate": 2.2176e-05, + "loss": 0.2053, + "step": 11095 + }, + { + "epoch": 1.09, + "learning_rate": 2.2186e-05, + "loss": 0.1449, + "step": 11100 + }, + { + "epoch": 1.09, + "learning_rate": 2.2196000000000002e-05, + "loss": 0.1455, + "step": 11105 + }, + { + "epoch": 1.09, + "learning_rate": 2.2206e-05, + "loss": 0.179, + "step": 11110 + }, + { + "epoch": 1.09, + "learning_rate": 2.2216000000000002e-05, + "loss": 0.1656, + "step": 11115 + }, + { + "epoch": 1.09, + "learning_rate": 2.2226e-05, + "loss": 0.1372, + "step": 11120 + }, + { + "epoch": 1.09, + "learning_rate": 2.2236e-05, + "loss": 0.143, + "step": 11125 + }, + { + "epoch": 1.09, + "learning_rate": 2.2246000000000004e-05, + "loss": 0.1712, + "step": 11130 + }, + { + "epoch": 1.09, + "learning_rate": 2.2256000000000002e-05, + "loss": 0.1462, + "step": 11135 + }, + { + "epoch": 1.09, + "learning_rate": 2.2266e-05, + "loss": 0.1497, + "step": 11140 + }, + { + "epoch": 1.09, + "learning_rate": 2.2276e-05, + "loss": 0.1728, + "step": 11145 + }, + { + "epoch": 1.09, + "learning_rate": 2.2286e-05, + "loss": 0.1447, + "step": 11150 + }, + { + "epoch": 1.09, + "learning_rate": 2.2296e-05, + "loss": 0.1429, + "step": 11155 + }, + { + "epoch": 1.09, + "learning_rate": 2.2306000000000003e-05, + "loss": 0.1534, + "step": 11160 + }, + { + "epoch": 1.09, + "learning_rate": 2.2316e-05, + "loss": 0.1549, + "step": 11165 + }, + { + "epoch": 1.09, + "learning_rate": 2.2326e-05, + "loss": 0.1361, + "step": 11170 + }, + { + "epoch": 1.09, + "learning_rate": 2.2336e-05, + "loss": 0.164, + "step": 11175 + }, + { + "epoch": 1.09, + "learning_rate": 2.2346000000000003e-05, + "loss": 0.1921, + "step": 11180 + }, + { + "epoch": 1.09, + "learning_rate": 2.2356e-05, + "loss": 0.1434, + "step": 11185 + }, + { + "epoch": 1.09, + "learning_rate": 2.2366000000000002e-05, + "loss": 0.1543, + "step": 11190 + }, + { + "epoch": 1.09, + "learning_rate": 2.2376e-05, + "loss": 0.1866, + "step": 11195 + }, + { + "epoch": 1.1, + "learning_rate": 2.2386e-05, + "loss": 0.1607, + "step": 11200 + }, + { + "epoch": 1.1, + "learning_rate": 2.2396e-05, + "loss": 0.1634, + "step": 11205 + }, + { + "epoch": 1.1, + "learning_rate": 2.2406000000000002e-05, + "loss": 0.1834, + "step": 11210 + }, + { + "epoch": 1.1, + "learning_rate": 2.2416e-05, + "loss": 0.1654, + "step": 11215 + }, + { + "epoch": 1.1, + "learning_rate": 2.2426000000000002e-05, + "loss": 0.1505, + "step": 11220 + }, + { + "epoch": 1.1, + "learning_rate": 2.2436e-05, + "loss": 0.1576, + "step": 11225 + }, + { + "epoch": 1.1, + "learning_rate": 2.2445999999999998e-05, + "loss": 0.1833, + "step": 11230 + }, + { + "epoch": 1.1, + "learning_rate": 2.2456000000000003e-05, + "loss": 0.1344, + "step": 11235 + }, + { + "epoch": 1.1, + "learning_rate": 2.2466e-05, + "loss": 0.1524, + "step": 11240 + }, + { + "epoch": 1.1, + "learning_rate": 2.2476e-05, + "loss": 0.1672, + "step": 11245 + }, + { + "epoch": 1.1, + "learning_rate": 2.2486e-05, + "loss": 0.1502, + "step": 11250 + }, + { + "epoch": 1.1, + "learning_rate": 2.2496e-05, + "loss": 0.1483, + "step": 11255 + }, + { + "epoch": 1.1, + "learning_rate": 2.2506e-05, + "loss": 0.1671, + "step": 11260 + }, + { + "epoch": 1.1, + "learning_rate": 2.2516000000000003e-05, + "loss": 0.1562, + "step": 11265 + }, + { + "epoch": 1.1, + "learning_rate": 2.2526e-05, + "loss": 0.1531, + "step": 11270 + }, + { + "epoch": 1.1, + "learning_rate": 2.2536e-05, + "loss": 0.1397, + "step": 11275 + }, + { + "epoch": 1.1, + "learning_rate": 2.2546e-05, + "loss": 0.1805, + "step": 11280 + }, + { + "epoch": 1.1, + "learning_rate": 2.2556000000000002e-05, + "loss": 0.151, + "step": 11285 + }, + { + "epoch": 1.1, + "learning_rate": 2.2566e-05, + "loss": 0.1617, + "step": 11290 + }, + { + "epoch": 1.1, + "learning_rate": 2.2576000000000002e-05, + "loss": 0.2115, + "step": 11295 + }, + { + "epoch": 1.1, + "learning_rate": 2.2586e-05, + "loss": 0.1583, + "step": 11300 + }, + { + "epoch": 1.11, + "learning_rate": 2.2596e-05, + "loss": 0.1471, + "step": 11305 + }, + { + "epoch": 1.11, + "learning_rate": 2.2606000000000003e-05, + "loss": 0.1888, + "step": 11310 + }, + { + "epoch": 1.11, + "learning_rate": 2.2616e-05, + "loss": 0.1657, + "step": 11315 + }, + { + "epoch": 1.11, + "learning_rate": 2.2626e-05, + "loss": 0.1401, + "step": 11320 + }, + { + "epoch": 1.11, + "learning_rate": 2.2635999999999998e-05, + "loss": 0.157, + "step": 11325 + }, + { + "epoch": 1.11, + "learning_rate": 2.2646e-05, + "loss": 0.1814, + "step": 11330 + }, + { + "epoch": 1.11, + "learning_rate": 2.2656e-05, + "loss": 0.1514, + "step": 11335 + }, + { + "epoch": 1.11, + "learning_rate": 2.2666e-05, + "loss": 0.1376, + "step": 11340 + }, + { + "epoch": 1.11, + "learning_rate": 2.2676e-05, + "loss": 0.1926, + "step": 11345 + }, + { + "epoch": 1.11, + "learning_rate": 2.2686e-05, + "loss": 0.1519, + "step": 11350 + }, + { + "epoch": 1.11, + "learning_rate": 2.2695999999999998e-05, + "loss": 0.135, + "step": 11355 + }, + { + "epoch": 1.11, + "learning_rate": 2.2706000000000002e-05, + "loss": 0.1616, + "step": 11360 + }, + { + "epoch": 1.11, + "learning_rate": 2.2716e-05, + "loss": 0.1645, + "step": 11365 + }, + { + "epoch": 1.11, + "learning_rate": 2.2726e-05, + "loss": 0.1252, + "step": 11370 + }, + { + "epoch": 1.11, + "learning_rate": 2.2736e-05, + "loss": 0.1504, + "step": 11375 + }, + { + "epoch": 1.11, + "learning_rate": 2.2746e-05, + "loss": 0.1757, + "step": 11380 + }, + { + "epoch": 1.11, + "learning_rate": 2.2756e-05, + "loss": 0.1547, + "step": 11385 + }, + { + "epoch": 1.11, + "learning_rate": 2.2766000000000002e-05, + "loss": 0.1467, + "step": 11390 + }, + { + "epoch": 1.11, + "learning_rate": 2.2776e-05, + "loss": 0.1926, + "step": 11395 + }, + { + "epoch": 1.11, + "learning_rate": 2.2786e-05, + "loss": 0.1442, + "step": 11400 + }, + { + "epoch": 1.12, + "learning_rate": 2.2796e-05, + "loss": 0.1546, + "step": 11405 + }, + { + "epoch": 1.12, + "learning_rate": 2.2806e-05, + "loss": 0.1883, + "step": 11410 + }, + { + "epoch": 1.12, + "learning_rate": 2.2816e-05, + "loss": 0.1728, + "step": 11415 + }, + { + "epoch": 1.12, + "learning_rate": 2.2826e-05, + "loss": 0.1531, + "step": 11420 + }, + { + "epoch": 1.12, + "learning_rate": 2.2836e-05, + "loss": 0.1391, + "step": 11425 + }, + { + "epoch": 1.12, + "learning_rate": 2.2845999999999998e-05, + "loss": 0.1775, + "step": 11430 + }, + { + "epoch": 1.12, + "learning_rate": 2.2856000000000003e-05, + "loss": 0.1571, + "step": 11435 + }, + { + "epoch": 1.12, + "learning_rate": 2.2866e-05, + "loss": 0.1564, + "step": 11440 + }, + { + "epoch": 1.12, + "learning_rate": 2.2876e-05, + "loss": 0.1712, + "step": 11445 + }, + { + "epoch": 1.12, + "learning_rate": 2.2886e-05, + "loss": 0.1399, + "step": 11450 + }, + { + "epoch": 1.12, + "learning_rate": 2.2896e-05, + "loss": 0.1397, + "step": 11455 + }, + { + "epoch": 1.12, + "learning_rate": 2.2906e-05, + "loss": 0.1864, + "step": 11460 + }, + { + "epoch": 1.12, + "learning_rate": 2.2916000000000002e-05, + "loss": 0.1843, + "step": 11465 + }, + { + "epoch": 1.12, + "learning_rate": 2.2926e-05, + "loss": 0.1508, + "step": 11470 + }, + { + "epoch": 1.12, + "learning_rate": 2.2936e-05, + "loss": 0.1482, + "step": 11475 + }, + { + "epoch": 1.12, + "learning_rate": 2.2946e-05, + "loss": 0.1829, + "step": 11480 + }, + { + "epoch": 1.12, + "learning_rate": 2.2956000000000002e-05, + "loss": 0.1385, + "step": 11485 + }, + { + "epoch": 1.12, + "learning_rate": 2.2966e-05, + "loss": 0.1594, + "step": 11490 + }, + { + "epoch": 1.12, + "learning_rate": 2.2976e-05, + "loss": 0.1658, + "step": 11495 + }, + { + "epoch": 1.12, + "learning_rate": 2.2986e-05, + "loss": 0.1448, + "step": 11500 + }, + { + "epoch": 1.12, + "eval_cer": 0.06571192056808434, + "eval_loss": 0.29266980290412903, + "eval_runtime": 269.19, + "eval_samples_per_second": 60.812, + "eval_steps_per_second": 1.69, + "eval_wer": 0.16950170755437727, + "step": 11500 + }, + { + "epoch": 1.12, + "learning_rate": 2.2995999999999998e-05, + "loss": 0.1521, + "step": 11505 + }, + { + "epoch": 1.13, + "learning_rate": 2.3006000000000003e-05, + "loss": 0.1673, + "step": 11510 + }, + { + "epoch": 1.13, + "learning_rate": 2.3016e-05, + "loss": 0.1803, + "step": 11515 + }, + { + "epoch": 1.13, + "learning_rate": 2.3026e-05, + "loss": 0.1325, + "step": 11520 + }, + { + "epoch": 1.13, + "learning_rate": 2.3036e-05, + "loss": 0.158, + "step": 11525 + }, + { + "epoch": 1.13, + "learning_rate": 2.3046e-05, + "loss": 0.1622, + "step": 11530 + }, + { + "epoch": 1.13, + "learning_rate": 2.3056e-05, + "loss": 0.152, + "step": 11535 + }, + { + "epoch": 1.13, + "learning_rate": 2.3066000000000002e-05, + "loss": 0.133, + "step": 11540 + }, + { + "epoch": 1.13, + "learning_rate": 2.3076e-05, + "loss": 0.1809, + "step": 11545 + }, + { + "epoch": 1.13, + "learning_rate": 2.3086e-05, + "loss": 0.1789, + "step": 11550 + }, + { + "epoch": 1.13, + "learning_rate": 2.3096e-05, + "loss": 0.1481, + "step": 11555 + }, + { + "epoch": 1.13, + "learning_rate": 2.3106000000000002e-05, + "loss": 0.1724, + "step": 11560 + }, + { + "epoch": 1.13, + "learning_rate": 2.3116e-05, + "loss": 0.1631, + "step": 11565 + }, + { + "epoch": 1.13, + "learning_rate": 2.3126000000000002e-05, + "loss": 0.1292, + "step": 11570 + }, + { + "epoch": 1.13, + "learning_rate": 2.3136e-05, + "loss": 0.1624, + "step": 11575 + }, + { + "epoch": 1.13, + "learning_rate": 2.3145999999999998e-05, + "loss": 0.1533, + "step": 11580 + }, + { + "epoch": 1.13, + "learning_rate": 2.3156000000000003e-05, + "loss": 0.1421, + "step": 11585 + }, + { + "epoch": 1.13, + "learning_rate": 2.3166e-05, + "loss": 0.1571, + "step": 11590 + }, + { + "epoch": 1.13, + "learning_rate": 2.3176e-05, + "loss": 0.186, + "step": 11595 + }, + { + "epoch": 1.13, + "learning_rate": 2.3186e-05, + "loss": 0.1578, + "step": 11600 + }, + { + "epoch": 1.13, + "learning_rate": 2.3196e-05, + "loss": 0.1578, + "step": 11605 + }, + { + "epoch": 1.14, + "learning_rate": 2.3206e-05, + "loss": 0.1686, + "step": 11610 + }, + { + "epoch": 1.14, + "learning_rate": 2.3216000000000003e-05, + "loss": 0.1534, + "step": 11615 + }, + { + "epoch": 1.14, + "learning_rate": 2.3226e-05, + "loss": 0.1472, + "step": 11620 + }, + { + "epoch": 1.14, + "learning_rate": 2.3236e-05, + "loss": 0.1623, + "step": 11625 + }, + { + "epoch": 1.14, + "learning_rate": 2.3246e-05, + "loss": 0.1883, + "step": 11630 + }, + { + "epoch": 1.14, + "learning_rate": 2.3256e-05, + "loss": 0.1615, + "step": 11635 + }, + { + "epoch": 1.14, + "learning_rate": 2.3266e-05, + "loss": 0.1278, + "step": 11640 + }, + { + "epoch": 1.14, + "learning_rate": 2.3276000000000002e-05, + "loss": 0.161, + "step": 11645 + }, + { + "epoch": 1.14, + "learning_rate": 2.3286e-05, + "loss": 0.1434, + "step": 11650 + }, + { + "epoch": 1.14, + "learning_rate": 2.3296e-05, + "loss": 0.1452, + "step": 11655 + }, + { + "epoch": 1.14, + "learning_rate": 2.3306e-05, + "loss": 0.1772, + "step": 11660 + }, + { + "epoch": 1.14, + "learning_rate": 2.3316000000000002e-05, + "loss": 0.1702, + "step": 11665 + }, + { + "epoch": 1.14, + "learning_rate": 2.3326e-05, + "loss": 0.1231, + "step": 11670 + }, + { + "epoch": 1.14, + "learning_rate": 2.3336e-05, + "loss": 0.1701, + "step": 11675 + }, + { + "epoch": 1.14, + "learning_rate": 2.3346e-05, + "loss": 0.1785, + "step": 11680 + }, + { + "epoch": 1.14, + "learning_rate": 2.3355999999999998e-05, + "loss": 0.1501, + "step": 11685 + }, + { + "epoch": 1.14, + "learning_rate": 2.3366000000000003e-05, + "loss": 0.152, + "step": 11690 + }, + { + "epoch": 1.14, + "learning_rate": 2.3376e-05, + "loss": 0.1968, + "step": 11695 + }, + { + "epoch": 1.14, + "learning_rate": 2.3386e-05, + "loss": 0.1416, + "step": 11700 + }, + { + "epoch": 1.14, + "learning_rate": 2.3396e-05, + "loss": 0.1446, + "step": 11705 + }, + { + "epoch": 1.15, + "learning_rate": 2.3406e-05, + "loss": 0.167, + "step": 11710 + }, + { + "epoch": 1.15, + "learning_rate": 2.3416e-05, + "loss": 0.1753, + "step": 11715 + }, + { + "epoch": 1.15, + "learning_rate": 2.3426000000000002e-05, + "loss": 0.148, + "step": 11720 + }, + { + "epoch": 1.15, + "learning_rate": 2.3436e-05, + "loss": 0.1483, + "step": 11725 + }, + { + "epoch": 1.15, + "learning_rate": 2.3446e-05, + "loss": 0.1758, + "step": 11730 + }, + { + "epoch": 1.15, + "learning_rate": 2.3456e-05, + "loss": 0.1575, + "step": 11735 + }, + { + "epoch": 1.15, + "learning_rate": 2.3466000000000002e-05, + "loss": 0.1645, + "step": 11740 + }, + { + "epoch": 1.15, + "learning_rate": 2.3476e-05, + "loss": 0.1843, + "step": 11745 + }, + { + "epoch": 1.15, + "learning_rate": 2.3486000000000002e-05, + "loss": 0.1575, + "step": 11750 + }, + { + "epoch": 1.15, + "learning_rate": 2.3496e-05, + "loss": 0.1454, + "step": 11755 + }, + { + "epoch": 1.15, + "learning_rate": 2.3505999999999998e-05, + "loss": 0.168, + "step": 11760 + }, + { + "epoch": 1.15, + "learning_rate": 2.3516000000000003e-05, + "loss": 0.1729, + "step": 11765 + }, + { + "epoch": 1.15, + "learning_rate": 2.3526e-05, + "loss": 0.1289, + "step": 11770 + }, + { + "epoch": 1.15, + "learning_rate": 2.3536e-05, + "loss": 0.1516, + "step": 11775 + }, + { + "epoch": 1.15, + "learning_rate": 2.3546e-05, + "loss": 0.1822, + "step": 11780 + }, + { + "epoch": 1.15, + "learning_rate": 2.3556e-05, + "loss": 0.1401, + "step": 11785 + }, + { + "epoch": 1.15, + "learning_rate": 2.3566e-05, + "loss": 0.1339, + "step": 11790 + }, + { + "epoch": 1.15, + "learning_rate": 2.3576000000000003e-05, + "loss": 0.1561, + "step": 11795 + }, + { + "epoch": 1.15, + "learning_rate": 2.3586e-05, + "loss": 0.1343, + "step": 11800 + }, + { + "epoch": 1.15, + "learning_rate": 2.3596e-05, + "loss": 0.1586, + "step": 11805 + }, + { + "epoch": 1.15, + "learning_rate": 2.3606e-05, + "loss": 0.1582, + "step": 11810 + }, + { + "epoch": 1.16, + "learning_rate": 2.3616000000000002e-05, + "loss": 0.1616, + "step": 11815 + }, + { + "epoch": 1.16, + "learning_rate": 2.3626e-05, + "loss": 0.1534, + "step": 11820 + }, + { + "epoch": 1.16, + "learning_rate": 2.3636000000000002e-05, + "loss": 0.16, + "step": 11825 + }, + { + "epoch": 1.16, + "learning_rate": 2.3646e-05, + "loss": 0.1583, + "step": 11830 + }, + { + "epoch": 1.16, + "learning_rate": 2.3656e-05, + "loss": 0.1384, + "step": 11835 + }, + { + "epoch": 1.16, + "learning_rate": 2.3666000000000003e-05, + "loss": 0.1458, + "step": 11840 + }, + { + "epoch": 1.16, + "learning_rate": 2.3676e-05, + "loss": 0.1727, + "step": 11845 + }, + { + "epoch": 1.16, + "learning_rate": 2.3686e-05, + "loss": 0.156, + "step": 11850 + }, + { + "epoch": 1.16, + "learning_rate": 2.3696e-05, + "loss": 0.1542, + "step": 11855 + }, + { + "epoch": 1.16, + "learning_rate": 2.3706e-05, + "loss": 0.1715, + "step": 11860 + }, + { + "epoch": 1.16, + "learning_rate": 2.3716e-05, + "loss": 0.1767, + "step": 11865 + }, + { + "epoch": 1.16, + "learning_rate": 2.3726000000000003e-05, + "loss": 0.128, + "step": 11870 + }, + { + "epoch": 1.16, + "learning_rate": 2.3736e-05, + "loss": 0.1489, + "step": 11875 + }, + { + "epoch": 1.16, + "learning_rate": 2.3746e-05, + "loss": 0.1764, + "step": 11880 + }, + { + "epoch": 1.16, + "learning_rate": 2.3756e-05, + "loss": 0.1401, + "step": 11885 + }, + { + "epoch": 1.16, + "learning_rate": 2.3766000000000003e-05, + "loss": 0.131, + "step": 11890 + }, + { + "epoch": 1.16, + "learning_rate": 2.3776e-05, + "loss": 0.17, + "step": 11895 + }, + { + "epoch": 1.16, + "learning_rate": 2.3786000000000002e-05, + "loss": 0.1617, + "step": 11900 + }, + { + "epoch": 1.16, + "learning_rate": 2.3796e-05, + "loss": 0.136, + "step": 11905 + }, + { + "epoch": 1.16, + "learning_rate": 2.3806e-05, + "loss": 0.1645, + "step": 11910 + }, + { + "epoch": 1.17, + "learning_rate": 2.3816000000000004e-05, + "loss": 0.1715, + "step": 11915 + }, + { + "epoch": 1.17, + "learning_rate": 2.3826000000000002e-05, + "loss": 0.1362, + "step": 11920 + }, + { + "epoch": 1.17, + "learning_rate": 2.3836e-05, + "loss": 0.1464, + "step": 11925 + }, + { + "epoch": 1.17, + "learning_rate": 2.3846000000000002e-05, + "loss": 0.1824, + "step": 11930 + }, + { + "epoch": 1.17, + "learning_rate": 2.3856e-05, + "loss": 0.1329, + "step": 11935 + }, + { + "epoch": 1.17, + "learning_rate": 2.3866e-05, + "loss": 0.1479, + "step": 11940 + }, + { + "epoch": 1.17, + "learning_rate": 2.3876e-05, + "loss": 0.1937, + "step": 11945 + }, + { + "epoch": 1.17, + "learning_rate": 2.3886e-05, + "loss": 0.1415, + "step": 11950 + }, + { + "epoch": 1.17, + "learning_rate": 2.3896e-05, + "loss": 0.1557, + "step": 11955 + }, + { + "epoch": 1.17, + "learning_rate": 2.3905999999999998e-05, + "loss": 0.1636, + "step": 11960 + }, + { + "epoch": 1.17, + "learning_rate": 2.3916000000000003e-05, + "loss": 0.1621, + "step": 11965 + }, + { + "epoch": 1.17, + "learning_rate": 2.3926e-05, + "loss": 0.1463, + "step": 11970 + }, + { + "epoch": 1.17, + "learning_rate": 2.3936e-05, + "loss": 0.1445, + "step": 11975 + }, + { + "epoch": 1.17, + "learning_rate": 2.3946e-05, + "loss": 0.1799, + "step": 11980 + }, + { + "epoch": 1.17, + "learning_rate": 2.3956e-05, + "loss": 0.1402, + "step": 11985 + }, + { + "epoch": 1.17, + "learning_rate": 2.3966e-05, + "loss": 0.1388, + "step": 11990 + }, + { + "epoch": 1.17, + "learning_rate": 2.3976000000000002e-05, + "loss": 0.1907, + "step": 11995 + }, + { + "epoch": 1.17, + "learning_rate": 2.3986e-05, + "loss": 0.1686, + "step": 12000 + }, + { + "epoch": 1.17, + "eval_cer": 0.06725075207354944, + "eval_loss": 0.2864223122596741, + "eval_runtime": 268.825, + "eval_samples_per_second": 60.895, + "eval_steps_per_second": 1.693, + "eval_wer": 0.1731061818039349, + "step": 12000 + }, + { + "epoch": 1.17, + "learning_rate": 2.3996e-05, + "loss": 0.1438, + "step": 12005 + }, + { + "epoch": 1.17, + "learning_rate": 2.4006e-05, + "loss": 0.1677, + "step": 12010 + }, + { + "epoch": 1.17, + "learning_rate": 2.4016000000000002e-05, + "loss": 0.1722, + "step": 12015 + }, + { + "epoch": 1.18, + "learning_rate": 2.4026e-05, + "loss": 0.1482, + "step": 12020 + }, + { + "epoch": 1.18, + "learning_rate": 2.4036e-05, + "loss": 0.1531, + "step": 12025 + }, + { + "epoch": 1.18, + "learning_rate": 2.4046e-05, + "loss": 0.1596, + "step": 12030 + }, + { + "epoch": 1.18, + "learning_rate": 2.4055999999999998e-05, + "loss": 0.1454, + "step": 12035 + }, + { + "epoch": 1.18, + "learning_rate": 2.4066000000000003e-05, + "loss": 0.1476, + "step": 12040 + }, + { + "epoch": 1.18, + "learning_rate": 2.4076e-05, + "loss": 0.1847, + "step": 12045 + }, + { + "epoch": 1.18, + "learning_rate": 2.4086e-05, + "loss": 0.1697, + "step": 12050 + }, + { + "epoch": 1.18, + "learning_rate": 2.4096e-05, + "loss": 0.1562, + "step": 12055 + }, + { + "epoch": 1.18, + "learning_rate": 2.4106e-05, + "loss": 0.1573, + "step": 12060 + }, + { + "epoch": 1.18, + "learning_rate": 2.4116e-05, + "loss": 0.1672, + "step": 12065 + }, + { + "epoch": 1.18, + "learning_rate": 2.4126000000000002e-05, + "loss": 0.1519, + "step": 12070 + }, + { + "epoch": 1.18, + "learning_rate": 2.4136e-05, + "loss": 0.1323, + "step": 12075 + }, + { + "epoch": 1.18, + "learning_rate": 2.4146e-05, + "loss": 0.1931, + "step": 12080 + }, + { + "epoch": 1.18, + "learning_rate": 2.4156e-05, + "loss": 0.1482, + "step": 12085 + }, + { + "epoch": 1.18, + "learning_rate": 2.4166e-05, + "loss": 0.1382, + "step": 12090 + }, + { + "epoch": 1.18, + "learning_rate": 2.4176e-05, + "loss": 0.1796, + "step": 12095 + }, + { + "epoch": 1.18, + "learning_rate": 2.4186000000000002e-05, + "loss": 0.1592, + "step": 12100 + }, + { + "epoch": 1.18, + "learning_rate": 2.4196e-05, + "loss": 0.1647, + "step": 12105 + }, + { + "epoch": 1.18, + "learning_rate": 2.4205999999999998e-05, + "loss": 0.1531, + "step": 12110 + }, + { + "epoch": 1.18, + "learning_rate": 2.4216e-05, + "loss": 0.1577, + "step": 12115 + }, + { + "epoch": 1.19, + "learning_rate": 2.4226e-05, + "loss": 0.1333, + "step": 12120 + }, + { + "epoch": 1.19, + "learning_rate": 2.4236e-05, + "loss": 0.1372, + "step": 12125 + }, + { + "epoch": 1.19, + "learning_rate": 2.4246e-05, + "loss": 0.1817, + "step": 12130 + }, + { + "epoch": 1.19, + "learning_rate": 2.4256e-05, + "loss": 0.133, + "step": 12135 + }, + { + "epoch": 1.19, + "learning_rate": 2.4265999999999998e-05, + "loss": 0.1602, + "step": 12140 + }, + { + "epoch": 1.19, + "learning_rate": 2.4276000000000003e-05, + "loss": 0.1824, + "step": 12145 + }, + { + "epoch": 1.19, + "learning_rate": 2.4286e-05, + "loss": 0.1588, + "step": 12150 + }, + { + "epoch": 1.19, + "learning_rate": 2.4296e-05, + "loss": 0.1576, + "step": 12155 + }, + { + "epoch": 1.19, + "learning_rate": 2.4306e-05, + "loss": 0.1636, + "step": 12160 + }, + { + "epoch": 1.19, + "learning_rate": 2.4316e-05, + "loss": 0.1683, + "step": 12165 + }, + { + "epoch": 1.19, + "learning_rate": 2.4326e-05, + "loss": 0.1423, + "step": 12170 + }, + { + "epoch": 1.19, + "learning_rate": 2.4336000000000002e-05, + "loss": 0.1515, + "step": 12175 + }, + { + "epoch": 1.19, + "learning_rate": 2.4346e-05, + "loss": 0.1793, + "step": 12180 + }, + { + "epoch": 1.19, + "learning_rate": 2.4356e-05, + "loss": 0.1535, + "step": 12185 + }, + { + "epoch": 1.19, + "learning_rate": 2.4366e-05, + "loss": 0.1547, + "step": 12190 + }, + { + "epoch": 1.19, + "learning_rate": 2.4376000000000002e-05, + "loss": 0.1966, + "step": 12195 + }, + { + "epoch": 1.19, + "learning_rate": 2.4386e-05, + "loss": 0.156, + "step": 12200 + }, + { + "epoch": 1.19, + "learning_rate": 2.4396e-05, + "loss": 0.1533, + "step": 12205 + }, + { + "epoch": 1.19, + "learning_rate": 2.4406e-05, + "loss": 0.1502, + "step": 12210 + }, + { + "epoch": 1.19, + "learning_rate": 2.4415999999999998e-05, + "loss": 0.1549, + "step": 12215 + }, + { + "epoch": 1.19, + "learning_rate": 2.4426000000000003e-05, + "loss": 0.1338, + "step": 12220 + }, + { + "epoch": 1.2, + "learning_rate": 2.4436e-05, + "loss": 0.156, + "step": 12225 + }, + { + "epoch": 1.2, + "learning_rate": 2.4446e-05, + "loss": 0.1831, + "step": 12230 + }, + { + "epoch": 1.2, + "learning_rate": 2.4456e-05, + "loss": 0.1435, + "step": 12235 + }, + { + "epoch": 1.2, + "learning_rate": 2.4466e-05, + "loss": 0.157, + "step": 12240 + }, + { + "epoch": 1.2, + "learning_rate": 2.4476e-05, + "loss": 0.1603, + "step": 12245 + }, + { + "epoch": 1.2, + "learning_rate": 2.4486000000000002e-05, + "loss": 0.1532, + "step": 12250 + }, + { + "epoch": 1.2, + "learning_rate": 2.4496e-05, + "loss": 0.1382, + "step": 12255 + }, + { + "epoch": 1.2, + "learning_rate": 2.4506e-05, + "loss": 0.1678, + "step": 12260 + }, + { + "epoch": 1.2, + "learning_rate": 2.4516e-05, + "loss": 0.1553, + "step": 12265 + }, + { + "epoch": 1.2, + "learning_rate": 2.4526000000000002e-05, + "loss": 0.1542, + "step": 12270 + }, + { + "epoch": 1.2, + "learning_rate": 2.4536e-05, + "loss": 0.166, + "step": 12275 + }, + { + "epoch": 1.2, + "learning_rate": 2.4546000000000002e-05, + "loss": 0.1772, + "step": 12280 + }, + { + "epoch": 1.2, + "learning_rate": 2.4556e-05, + "loss": 0.1652, + "step": 12285 + }, + { + "epoch": 1.2, + "learning_rate": 2.4565999999999998e-05, + "loss": 0.1307, + "step": 12290 + }, + { + "epoch": 1.2, + "learning_rate": 2.4576000000000003e-05, + "loss": 0.1694, + "step": 12295 + }, + { + "epoch": 1.2, + "learning_rate": 2.4586e-05, + "loss": 0.1519, + "step": 12300 + }, + { + "epoch": 1.2, + "learning_rate": 2.4596e-05, + "loss": 0.1421, + "step": 12305 + }, + { + "epoch": 1.2, + "learning_rate": 2.4606e-05, + "loss": 0.1744, + "step": 12310 + }, + { + "epoch": 1.2, + "learning_rate": 2.4616e-05, + "loss": 0.165, + "step": 12315 + }, + { + "epoch": 1.2, + "learning_rate": 2.4626e-05, + "loss": 0.1351, + "step": 12320 + }, + { + "epoch": 1.21, + "learning_rate": 2.4636000000000003e-05, + "loss": 0.1615, + "step": 12325 + }, + { + "epoch": 1.21, + "learning_rate": 2.4646e-05, + "loss": 0.1621, + "step": 12330 + }, + { + "epoch": 1.21, + "learning_rate": 2.4656e-05, + "loss": 0.1463, + "step": 12335 + }, + { + "epoch": 1.21, + "learning_rate": 2.4666e-05, + "loss": 0.1474, + "step": 12340 + }, + { + "epoch": 1.21, + "learning_rate": 2.4676000000000002e-05, + "loss": 0.1735, + "step": 12345 + }, + { + "epoch": 1.21, + "learning_rate": 2.4686e-05, + "loss": 0.1368, + "step": 12350 + }, + { + "epoch": 1.21, + "learning_rate": 2.4696000000000002e-05, + "loss": 0.1403, + "step": 12355 + }, + { + "epoch": 1.21, + "learning_rate": 2.4706e-05, + "loss": 0.1616, + "step": 12360 + }, + { + "epoch": 1.21, + "learning_rate": 2.4716e-05, + "loss": 0.1747, + "step": 12365 + }, + { + "epoch": 1.21, + "learning_rate": 2.4726000000000003e-05, + "loss": 0.1319, + "step": 12370 + }, + { + "epoch": 1.21, + "learning_rate": 2.4736e-05, + "loss": 0.1658, + "step": 12375 + }, + { + "epoch": 1.21, + "learning_rate": 2.4746e-05, + "loss": 0.1683, + "step": 12380 + }, + { + "epoch": 1.21, + "learning_rate": 2.4756e-05, + "loss": 0.1433, + "step": 12385 + }, + { + "epoch": 1.21, + "learning_rate": 2.4766e-05, + "loss": 0.1454, + "step": 12390 + }, + { + "epoch": 1.21, + "learning_rate": 2.4776e-05, + "loss": 0.1765, + "step": 12395 + }, + { + "epoch": 1.21, + "learning_rate": 2.4786000000000003e-05, + "loss": 0.1504, + "step": 12400 + }, + { + "epoch": 1.21, + "learning_rate": 2.4796e-05, + "loss": 0.1305, + "step": 12405 + }, + { + "epoch": 1.21, + "learning_rate": 2.4806e-05, + "loss": 0.1639, + "step": 12410 + }, + { + "epoch": 1.21, + "learning_rate": 2.4816e-05, + "loss": 0.1629, + "step": 12415 + }, + { + "epoch": 1.21, + "learning_rate": 2.4826000000000003e-05, + "loss": 0.1564, + "step": 12420 + }, + { + "epoch": 1.21, + "learning_rate": 2.4836e-05, + "loss": 0.1543, + "step": 12425 + }, + { + "epoch": 1.22, + "learning_rate": 2.4846000000000002e-05, + "loss": 0.1755, + "step": 12430 + }, + { + "epoch": 1.22, + "learning_rate": 2.4856e-05, + "loss": 0.1509, + "step": 12435 + }, + { + "epoch": 1.22, + "learning_rate": 2.4866e-05, + "loss": 0.1417, + "step": 12440 + }, + { + "epoch": 1.22, + "learning_rate": 2.4876000000000004e-05, + "loss": 0.175, + "step": 12445 + }, + { + "epoch": 1.22, + "learning_rate": 2.4886000000000002e-05, + "loss": 0.1611, + "step": 12450 + }, + { + "epoch": 1.22, + "learning_rate": 2.4896e-05, + "loss": 0.1354, + "step": 12455 + }, + { + "epoch": 1.22, + "learning_rate": 2.4906000000000002e-05, + "loss": 0.1922, + "step": 12460 + }, + { + "epoch": 1.22, + "learning_rate": 2.4916e-05, + "loss": 0.1632, + "step": 12465 + }, + { + "epoch": 1.22, + "learning_rate": 2.4926e-05, + "loss": 0.1418, + "step": 12470 + }, + { + "epoch": 1.22, + "learning_rate": 2.4936000000000003e-05, + "loss": 0.1367, + "step": 12475 + }, + { + "epoch": 1.22, + "learning_rate": 2.4946e-05, + "loss": 0.1932, + "step": 12480 + }, + { + "epoch": 1.22, + "learning_rate": 2.4956e-05, + "loss": 0.1544, + "step": 12485 + }, + { + "epoch": 1.22, + "learning_rate": 2.4966e-05, + "loss": 0.1502, + "step": 12490 + }, + { + "epoch": 1.22, + "learning_rate": 2.4976e-05, + "loss": 0.1615, + "step": 12495 + }, + { + "epoch": 1.22, + "learning_rate": 2.4986e-05, + "loss": 0.1506, + "step": 12500 + }, + { + "epoch": 1.22, + "eval_cer": 0.06667845936490539, + "eval_loss": 0.2891385555267334, + "eval_runtime": 269.3231, + "eval_samples_per_second": 60.782, + "eval_steps_per_second": 1.689, + "eval_wer": 0.1733739054347897, + "step": 12500 + }, + { + "epoch": 1.22, + "learning_rate": 2.4996000000000003e-05, + "loss": 0.1485, + "step": 12505 + }, + { + "epoch": 1.22, + "learning_rate": 2.5006e-05, + "loss": 0.1668, + "step": 12510 + }, + { + "epoch": 1.22, + "learning_rate": 2.5016e-05, + "loss": 0.1541, + "step": 12515 + }, + { + "epoch": 1.22, + "learning_rate": 2.5026e-05, + "loss": 0.1456, + "step": 12520 + }, + { + "epoch": 1.22, + "learning_rate": 2.5036000000000002e-05, + "loss": 0.1463, + "step": 12525 + }, + { + "epoch": 1.23, + "learning_rate": 2.5046e-05, + "loss": 0.1804, + "step": 12530 + }, + { + "epoch": 1.23, + "learning_rate": 2.5056000000000002e-05, + "loss": 0.1427, + "step": 12535 + }, + { + "epoch": 1.23, + "learning_rate": 2.5066e-05, + "loss": 0.1474, + "step": 12540 + }, + { + "epoch": 1.23, + "learning_rate": 2.5076e-05, + "loss": 0.1758, + "step": 12545 + }, + { + "epoch": 1.23, + "learning_rate": 2.5086000000000003e-05, + "loss": 0.1644, + "step": 12550 + }, + { + "epoch": 1.23, + "learning_rate": 2.5096e-05, + "loss": 0.1556, + "step": 12555 + }, + { + "epoch": 1.23, + "learning_rate": 2.5106e-05, + "loss": 0.1424, + "step": 12560 + }, + { + "epoch": 1.23, + "learning_rate": 2.5116e-05, + "loss": 0.1806, + "step": 12565 + }, + { + "epoch": 1.23, + "learning_rate": 2.5126e-05, + "loss": 0.139, + "step": 12570 + }, + { + "epoch": 1.23, + "learning_rate": 2.5136e-05, + "loss": 0.1315, + "step": 12575 + }, + { + "epoch": 1.23, + "learning_rate": 2.5146e-05, + "loss": 0.1705, + "step": 12580 + }, + { + "epoch": 1.23, + "learning_rate": 2.5156e-05, + "loss": 0.1629, + "step": 12585 + }, + { + "epoch": 1.23, + "learning_rate": 2.5166e-05, + "loss": 0.1365, + "step": 12590 + }, + { + "epoch": 1.23, + "learning_rate": 2.5175999999999997e-05, + "loss": 0.17, + "step": 12595 + }, + { + "epoch": 1.23, + "learning_rate": 2.5186000000000002e-05, + "loss": 0.1573, + "step": 12600 + }, + { + "epoch": 1.23, + "learning_rate": 2.5196e-05, + "loss": 0.1388, + "step": 12605 + }, + { + "epoch": 1.23, + "learning_rate": 2.5206e-05, + "loss": 0.1623, + "step": 12610 + }, + { + "epoch": 1.23, + "learning_rate": 2.5216e-05, + "loss": 0.1639, + "step": 12615 + }, + { + "epoch": 1.23, + "learning_rate": 2.5226e-05, + "loss": 0.1435, + "step": 12620 + }, + { + "epoch": 1.23, + "learning_rate": 2.5236e-05, + "loss": 0.1675, + "step": 12625 + }, + { + "epoch": 1.24, + "learning_rate": 2.5246000000000002e-05, + "loss": 0.172, + "step": 12630 + }, + { + "epoch": 1.24, + "learning_rate": 2.5256e-05, + "loss": 0.1671, + "step": 12635 + }, + { + "epoch": 1.24, + "learning_rate": 2.5266e-05, + "loss": 0.141, + "step": 12640 + }, + { + "epoch": 1.24, + "learning_rate": 2.5276e-05, + "loss": 0.1763, + "step": 12645 + }, + { + "epoch": 1.24, + "learning_rate": 2.5286e-05, + "loss": 0.1575, + "step": 12650 + }, + { + "epoch": 1.24, + "learning_rate": 2.5296e-05, + "loss": 0.1383, + "step": 12655 + }, + { + "epoch": 1.24, + "learning_rate": 2.5306e-05, + "loss": 0.1414, + "step": 12660 + }, + { + "epoch": 1.24, + "learning_rate": 2.5316e-05, + "loss": 0.1663, + "step": 12665 + }, + { + "epoch": 1.24, + "learning_rate": 2.5325999999999998e-05, + "loss": 0.1348, + "step": 12670 + }, + { + "epoch": 1.24, + "learning_rate": 2.5336000000000003e-05, + "loss": 0.1488, + "step": 12675 + }, + { + "epoch": 1.24, + "learning_rate": 2.5346e-05, + "loss": 0.1674, + "step": 12680 + }, + { + "epoch": 1.24, + "learning_rate": 2.5356e-05, + "loss": 0.1411, + "step": 12685 + }, + { + "epoch": 1.24, + "learning_rate": 2.5366e-05, + "loss": 0.1383, + "step": 12690 + }, + { + "epoch": 1.24, + "learning_rate": 2.5376e-05, + "loss": 0.176, + "step": 12695 + }, + { + "epoch": 1.24, + "learning_rate": 2.5386e-05, + "loss": 0.1467, + "step": 12700 + }, + { + "epoch": 1.24, + "learning_rate": 2.5396000000000002e-05, + "loss": 0.1394, + "step": 12705 + }, + { + "epoch": 1.24, + "learning_rate": 2.5406e-05, + "loss": 0.1963, + "step": 12710 + }, + { + "epoch": 1.24, + "learning_rate": 2.5416e-05, + "loss": 0.1612, + "step": 12715 + }, + { + "epoch": 1.24, + "learning_rate": 2.5426e-05, + "loss": 0.1506, + "step": 12720 + }, + { + "epoch": 1.24, + "learning_rate": 2.5436000000000002e-05, + "loss": 0.1897, + "step": 12725 + }, + { + "epoch": 1.24, + "learning_rate": 2.5446e-05, + "loss": 0.1719, + "step": 12730 + }, + { + "epoch": 1.25, + "learning_rate": 2.5456e-05, + "loss": 0.1427, + "step": 12735 + }, + { + "epoch": 1.25, + "learning_rate": 2.5466e-05, + "loss": 0.143, + "step": 12740 + }, + { + "epoch": 1.25, + "learning_rate": 2.5475999999999998e-05, + "loss": 0.1467, + "step": 12745 + }, + { + "epoch": 1.25, + "learning_rate": 2.5486000000000003e-05, + "loss": 0.1535, + "step": 12750 + }, + { + "epoch": 1.25, + "learning_rate": 2.5496e-05, + "loss": 0.1605, + "step": 12755 + }, + { + "epoch": 1.25, + "learning_rate": 2.5506e-05, + "loss": 0.1742, + "step": 12760 + }, + { + "epoch": 1.25, + "learning_rate": 2.5516e-05, + "loss": 0.1599, + "step": 12765 + }, + { + "epoch": 1.25, + "learning_rate": 2.5526e-05, + "loss": 0.1575, + "step": 12770 + }, + { + "epoch": 1.25, + "learning_rate": 2.5536e-05, + "loss": 0.1622, + "step": 12775 + }, + { + "epoch": 1.25, + "learning_rate": 2.5546000000000002e-05, + "loss": 0.1555, + "step": 12780 + }, + { + "epoch": 1.25, + "learning_rate": 2.5556e-05, + "loss": 0.1499, + "step": 12785 + }, + { + "epoch": 1.25, + "learning_rate": 2.5566e-05, + "loss": 0.1514, + "step": 12790 + }, + { + "epoch": 1.25, + "learning_rate": 2.5576e-05, + "loss": 0.1703, + "step": 12795 + }, + { + "epoch": 1.25, + "learning_rate": 2.5586000000000002e-05, + "loss": 0.1663, + "step": 12800 + }, + { + "epoch": 1.25, + "learning_rate": 2.5596e-05, + "loss": 0.1314, + "step": 12805 + }, + { + "epoch": 1.25, + "learning_rate": 2.5606000000000002e-05, + "loss": 0.1732, + "step": 12810 + }, + { + "epoch": 1.25, + "learning_rate": 2.5616e-05, + "loss": 0.1756, + "step": 12815 + }, + { + "epoch": 1.25, + "learning_rate": 2.5625999999999998e-05, + "loss": 0.1384, + "step": 12820 + }, + { + "epoch": 1.25, + "learning_rate": 2.5636000000000003e-05, + "loss": 0.1428, + "step": 12825 + }, + { + "epoch": 1.25, + "learning_rate": 2.5646e-05, + "loss": 0.1804, + "step": 12830 + }, + { + "epoch": 1.26, + "learning_rate": 2.5656e-05, + "loss": 0.1604, + "step": 12835 + }, + { + "epoch": 1.26, + "learning_rate": 2.5666e-05, + "loss": 0.1422, + "step": 12840 + }, + { + "epoch": 1.26, + "learning_rate": 2.5676e-05, + "loss": 0.1659, + "step": 12845 + }, + { + "epoch": 1.26, + "learning_rate": 2.5686e-05, + "loss": 0.1477, + "step": 12850 + }, + { + "epoch": 1.26, + "learning_rate": 2.5696000000000003e-05, + "loss": 0.1725, + "step": 12855 + }, + { + "epoch": 1.26, + "learning_rate": 2.5706e-05, + "loss": 0.1557, + "step": 12860 + }, + { + "epoch": 1.26, + "learning_rate": 2.5716e-05, + "loss": 0.1648, + "step": 12865 + }, + { + "epoch": 1.26, + "learning_rate": 2.5726e-05, + "loss": 0.148, + "step": 12870 + }, + { + "epoch": 1.26, + "learning_rate": 2.5736000000000002e-05, + "loss": 0.1438, + "step": 12875 + }, + { + "epoch": 1.26, + "learning_rate": 2.5746e-05, + "loss": 0.1757, + "step": 12880 + }, + { + "epoch": 1.26, + "learning_rate": 2.5756000000000002e-05, + "loss": 0.1303, + "step": 12885 + }, + { + "epoch": 1.26, + "learning_rate": 2.5766e-05, + "loss": 0.1544, + "step": 12890 + }, + { + "epoch": 1.26, + "learning_rate": 2.5776e-05, + "loss": 0.1573, + "step": 12895 + }, + { + "epoch": 1.26, + "learning_rate": 2.5786e-05, + "loss": 0.1509, + "step": 12900 + }, + { + "epoch": 1.26, + "learning_rate": 2.5796000000000002e-05, + "loss": 0.1285, + "step": 12905 + }, + { + "epoch": 1.26, + "learning_rate": 2.5806e-05, + "loss": 0.1496, + "step": 12910 + }, + { + "epoch": 1.26, + "learning_rate": 2.5816e-05, + "loss": 0.1686, + "step": 12915 + }, + { + "epoch": 1.26, + "learning_rate": 2.5826e-05, + "loss": 0.1381, + "step": 12920 + }, + { + "epoch": 1.26, + "learning_rate": 2.5835999999999998e-05, + "loss": 0.1538, + "step": 12925 + }, + { + "epoch": 1.26, + "learning_rate": 2.5846000000000003e-05, + "loss": 0.2035, + "step": 12930 + }, + { + "epoch": 1.26, + "learning_rate": 2.5856e-05, + "loss": 0.1505, + "step": 12935 + }, + { + "epoch": 1.27, + "learning_rate": 2.5866e-05, + "loss": 0.1403, + "step": 12940 + }, + { + "epoch": 1.27, + "learning_rate": 2.5876e-05, + "loss": 0.1882, + "step": 12945 + }, + { + "epoch": 1.27, + "learning_rate": 2.5886e-05, + "loss": 0.161, + "step": 12950 + }, + { + "epoch": 1.27, + "learning_rate": 2.5896e-05, + "loss": 0.1303, + "step": 12955 + }, + { + "epoch": 1.27, + "learning_rate": 2.5906000000000002e-05, + "loss": 0.1581, + "step": 12960 + }, + { + "epoch": 1.27, + "learning_rate": 2.5916e-05, + "loss": 0.1535, + "step": 12965 + }, + { + "epoch": 1.27, + "learning_rate": 2.5926e-05, + "loss": 0.1582, + "step": 12970 + }, + { + "epoch": 1.27, + "learning_rate": 2.5936e-05, + "loss": 0.1578, + "step": 12975 + }, + { + "epoch": 1.27, + "learning_rate": 2.5946000000000002e-05, + "loss": 0.1479, + "step": 12980 + }, + { + "epoch": 1.27, + "learning_rate": 2.5956e-05, + "loss": 0.1446, + "step": 12985 + }, + { + "epoch": 1.27, + "learning_rate": 2.5966000000000002e-05, + "loss": 0.1307, + "step": 12990 + }, + { + "epoch": 1.27, + "learning_rate": 2.5976e-05, + "loss": 0.1569, + "step": 12995 + }, + { + "epoch": 1.27, + "learning_rate": 2.5985999999999998e-05, + "loss": 0.1621, + "step": 13000 + }, + { + "epoch": 1.27, + "eval_cer": 0.0669351239736306, + "eval_loss": 0.28366291522979736, + "eval_runtime": 269.0715, + "eval_samples_per_second": 60.839, + "eval_steps_per_second": 1.691, + "eval_wer": 0.17215282448430552, + "step": 13000 + }, + { + "epoch": 1.27, + "learning_rate": 2.5996000000000003e-05, + "loss": 0.1383, + "step": 13005 + }, + { + "epoch": 1.27, + "learning_rate": 2.6006e-05, + "loss": 0.1684, + "step": 13010 + }, + { + "epoch": 1.27, + "learning_rate": 2.6016e-05, + "loss": 0.158, + "step": 13015 + }, + { + "epoch": 1.27, + "learning_rate": 2.6026e-05, + "loss": 0.1432, + "step": 13020 + }, + { + "epoch": 1.27, + "learning_rate": 2.6036e-05, + "loss": 0.1456, + "step": 13025 + }, + { + "epoch": 1.27, + "learning_rate": 2.6046e-05, + "loss": 0.1755, + "step": 13030 + }, + { + "epoch": 1.27, + "learning_rate": 2.6056000000000003e-05, + "loss": 0.1448, + "step": 13035 + }, + { + "epoch": 1.28, + "learning_rate": 2.6066e-05, + "loss": 0.1299, + "step": 13040 + }, + { + "epoch": 1.28, + "learning_rate": 2.6076e-05, + "loss": 0.1771, + "step": 13045 + }, + { + "epoch": 1.28, + "learning_rate": 2.6086e-05, + "loss": 0.1553, + "step": 13050 + }, + { + "epoch": 1.28, + "learning_rate": 2.6096000000000002e-05, + "loss": 0.1389, + "step": 13055 + }, + { + "epoch": 1.28, + "learning_rate": 2.6106e-05, + "loss": 0.1579, + "step": 13060 + }, + { + "epoch": 1.28, + "learning_rate": 2.6116000000000002e-05, + "loss": 0.1548, + "step": 13065 + }, + { + "epoch": 1.28, + "learning_rate": 2.6126e-05, + "loss": 0.1433, + "step": 13070 + }, + { + "epoch": 1.28, + "learning_rate": 2.6136e-05, + "loss": 0.1383, + "step": 13075 + }, + { + "epoch": 1.28, + "learning_rate": 2.6146000000000003e-05, + "loss": 0.1634, + "step": 13080 + }, + { + "epoch": 1.28, + "learning_rate": 2.6156e-05, + "loss": 0.141, + "step": 13085 + }, + { + "epoch": 1.28, + "learning_rate": 2.6166e-05, + "loss": 0.1193, + "step": 13090 + }, + { + "epoch": 1.28, + "learning_rate": 2.6176e-05, + "loss": 0.1831, + "step": 13095 + }, + { + "epoch": 1.28, + "learning_rate": 2.6186e-05, + "loss": 0.1528, + "step": 13100 + }, + { + "epoch": 1.28, + "learning_rate": 2.6196e-05, + "loss": 0.1372, + "step": 13105 + }, + { + "epoch": 1.28, + "learning_rate": 2.6206000000000003e-05, + "loss": 0.1541, + "step": 13110 + }, + { + "epoch": 1.28, + "learning_rate": 2.6216e-05, + "loss": 0.1487, + "step": 13115 + }, + { + "epoch": 1.28, + "learning_rate": 2.6226e-05, + "loss": 0.1668, + "step": 13120 + }, + { + "epoch": 1.28, + "learning_rate": 2.6236e-05, + "loss": 0.1572, + "step": 13125 + }, + { + "epoch": 1.28, + "learning_rate": 2.6246000000000002e-05, + "loss": 0.1725, + "step": 13130 + }, + { + "epoch": 1.28, + "learning_rate": 2.6256e-05, + "loss": 0.143, + "step": 13135 + }, + { + "epoch": 1.28, + "learning_rate": 2.6266000000000002e-05, + "loss": 0.1489, + "step": 13140 + }, + { + "epoch": 1.29, + "learning_rate": 2.6276e-05, + "loss": 0.1638, + "step": 13145 + }, + { + "epoch": 1.29, + "learning_rate": 2.6286e-05, + "loss": 0.16, + "step": 13150 + }, + { + "epoch": 1.29, + "learning_rate": 2.6296000000000004e-05, + "loss": 0.1478, + "step": 13155 + }, + { + "epoch": 1.29, + "learning_rate": 2.6306000000000002e-05, + "loss": 0.1781, + "step": 13160 + }, + { + "epoch": 1.29, + "learning_rate": 2.6316e-05, + "loss": 0.1753, + "step": 13165 + }, + { + "epoch": 1.29, + "learning_rate": 2.6326000000000002e-05, + "loss": 0.1414, + "step": 13170 + }, + { + "epoch": 1.29, + "learning_rate": 2.6336e-05, + "loss": 0.1674, + "step": 13175 + }, + { + "epoch": 1.29, + "learning_rate": 2.6346e-05, + "loss": 0.1889, + "step": 13180 + }, + { + "epoch": 1.29, + "learning_rate": 2.6356000000000003e-05, + "loss": 0.1539, + "step": 13185 + }, + { + "epoch": 1.29, + "learning_rate": 2.6366e-05, + "loss": 0.1455, + "step": 13190 + }, + { + "epoch": 1.29, + "learning_rate": 2.6376e-05, + "loss": 0.1835, + "step": 13195 + }, + { + "epoch": 1.29, + "learning_rate": 2.6385999999999998e-05, + "loss": 0.1583, + "step": 13200 + }, + { + "epoch": 1.29, + "learning_rate": 2.6396000000000003e-05, + "loss": 0.1422, + "step": 13205 + }, + { + "epoch": 1.29, + "learning_rate": 2.6406e-05, + "loss": 0.1485, + "step": 13210 + }, + { + "epoch": 1.29, + "learning_rate": 2.6416e-05, + "loss": 0.1714, + "step": 13215 + }, + { + "epoch": 1.29, + "learning_rate": 2.6426e-05, + "loss": 0.153, + "step": 13220 + }, + { + "epoch": 1.29, + "learning_rate": 2.6436e-05, + "loss": 0.1631, + "step": 13225 + }, + { + "epoch": 1.29, + "learning_rate": 2.6446e-05, + "loss": 0.1846, + "step": 13230 + }, + { + "epoch": 1.29, + "learning_rate": 2.6456000000000002e-05, + "loss": 0.1326, + "step": 13235 + }, + { + "epoch": 1.29, + "learning_rate": 2.6466e-05, + "loss": 0.1603, + "step": 13240 + }, + { + "epoch": 1.3, + "learning_rate": 2.6476e-05, + "loss": 0.1794, + "step": 13245 + }, + { + "epoch": 1.3, + "learning_rate": 2.6486e-05, + "loss": 0.1608, + "step": 13250 + }, + { + "epoch": 1.3, + "learning_rate": 2.6496000000000002e-05, + "loss": 0.141, + "step": 13255 + }, + { + "epoch": 1.3, + "learning_rate": 2.6506e-05, + "loss": 0.1471, + "step": 13260 + }, + { + "epoch": 1.3, + "learning_rate": 2.6516e-05, + "loss": 0.1548, + "step": 13265 + }, + { + "epoch": 1.3, + "learning_rate": 2.6526e-05, + "loss": 0.1307, + "step": 13270 + }, + { + "epoch": 1.3, + "learning_rate": 2.6535999999999998e-05, + "loss": 0.143, + "step": 13275 + }, + { + "epoch": 1.3, + "learning_rate": 2.6546000000000003e-05, + "loss": 0.1914, + "step": 13280 + }, + { + "epoch": 1.3, + "learning_rate": 2.6556e-05, + "loss": 0.1419, + "step": 13285 + }, + { + "epoch": 1.3, + "learning_rate": 2.6566e-05, + "loss": 0.1393, + "step": 13290 + }, + { + "epoch": 1.3, + "learning_rate": 2.6576e-05, + "loss": 0.1881, + "step": 13295 + }, + { + "epoch": 1.3, + "learning_rate": 2.6586e-05, + "loss": 0.1583, + "step": 13300 + }, + { + "epoch": 1.3, + "learning_rate": 2.6596e-05, + "loss": 0.1474, + "step": 13305 + }, + { + "epoch": 1.3, + "learning_rate": 2.6606000000000002e-05, + "loss": 0.1628, + "step": 13310 + }, + { + "epoch": 1.3, + "learning_rate": 2.6616e-05, + "loss": 0.1785, + "step": 13315 + }, + { + "epoch": 1.3, + "learning_rate": 2.6626e-05, + "loss": 0.1386, + "step": 13320 + }, + { + "epoch": 1.3, + "learning_rate": 2.6636e-05, + "loss": 0.1393, + "step": 13325 + }, + { + "epoch": 1.3, + "learning_rate": 2.6646000000000002e-05, + "loss": 0.1806, + "step": 13330 + }, + { + "epoch": 1.3, + "learning_rate": 2.6656e-05, + "loss": 0.1517, + "step": 13335 + }, + { + "epoch": 1.3, + "learning_rate": 2.6666000000000002e-05, + "loss": 0.1501, + "step": 13340 + }, + { + "epoch": 1.3, + "learning_rate": 2.6676e-05, + "loss": 0.1737, + "step": 13345 + }, + { + "epoch": 1.31, + "learning_rate": 2.6685999999999998e-05, + "loss": 0.1539, + "step": 13350 + }, + { + "epoch": 1.31, + "learning_rate": 2.6696e-05, + "loss": 0.1394, + "step": 13355 + }, + { + "epoch": 1.31, + "learning_rate": 2.6706e-05, + "loss": 0.1889, + "step": 13360 + }, + { + "epoch": 1.31, + "learning_rate": 2.6716e-05, + "loss": 0.1582, + "step": 13365 + }, + { + "epoch": 1.31, + "learning_rate": 2.6726e-05, + "loss": 0.1264, + "step": 13370 + }, + { + "epoch": 1.31, + "learning_rate": 2.6736e-05, + "loss": 0.1337, + "step": 13375 + }, + { + "epoch": 1.31, + "learning_rate": 2.6745999999999998e-05, + "loss": 0.1845, + "step": 13380 + }, + { + "epoch": 1.31, + "learning_rate": 2.6756000000000003e-05, + "loss": 0.147, + "step": 13385 + }, + { + "epoch": 1.31, + "learning_rate": 2.6766e-05, + "loss": 0.1456, + "step": 13390 + }, + { + "epoch": 1.31, + "learning_rate": 2.6776e-05, + "loss": 0.1723, + "step": 13395 + }, + { + "epoch": 1.31, + "learning_rate": 2.6786e-05, + "loss": 0.162, + "step": 13400 + }, + { + "epoch": 1.31, + "learning_rate": 2.6796e-05, + "loss": 0.1155, + "step": 13405 + }, + { + "epoch": 1.31, + "learning_rate": 2.6806e-05, + "loss": 0.1495, + "step": 13410 + }, + { + "epoch": 1.31, + "learning_rate": 2.6816000000000002e-05, + "loss": 0.161, + "step": 13415 + }, + { + "epoch": 1.31, + "learning_rate": 2.6826e-05, + "loss": 0.1246, + "step": 13420 + }, + { + "epoch": 1.31, + "learning_rate": 2.6836e-05, + "loss": 0.1406, + "step": 13425 + }, + { + "epoch": 1.31, + "learning_rate": 2.6846e-05, + "loss": 0.1627, + "step": 13430 + }, + { + "epoch": 1.31, + "learning_rate": 2.6856000000000002e-05, + "loss": 0.1349, + "step": 13435 + }, + { + "epoch": 1.31, + "learning_rate": 2.6866e-05, + "loss": 0.1423, + "step": 13440 + }, + { + "epoch": 1.31, + "learning_rate": 2.6876e-05, + "loss": 0.1784, + "step": 13445 + }, + { + "epoch": 1.32, + "learning_rate": 2.6886e-05, + "loss": 0.1548, + "step": 13450 + }, + { + "epoch": 1.32, + "learning_rate": 2.6895999999999998e-05, + "loss": 0.1449, + "step": 13455 + }, + { + "epoch": 1.32, + "learning_rate": 2.6906000000000003e-05, + "loss": 0.1644, + "step": 13460 + }, + { + "epoch": 1.32, + "learning_rate": 2.6916e-05, + "loss": 0.1533, + "step": 13465 + }, + { + "epoch": 1.32, + "learning_rate": 2.6926e-05, + "loss": 0.1397, + "step": 13470 + }, + { + "epoch": 1.32, + "learning_rate": 2.6936e-05, + "loss": 0.165, + "step": 13475 + }, + { + "epoch": 1.32, + "learning_rate": 2.6946e-05, + "loss": 0.1867, + "step": 13480 + }, + { + "epoch": 1.32, + "learning_rate": 2.6956e-05, + "loss": 0.1417, + "step": 13485 + }, + { + "epoch": 1.32, + "learning_rate": 2.6966000000000002e-05, + "loss": 0.1317, + "step": 13490 + }, + { + "epoch": 1.32, + "learning_rate": 2.6976e-05, + "loss": 0.1555, + "step": 13495 + }, + { + "epoch": 1.32, + "learning_rate": 2.6986e-05, + "loss": 0.1573, + "step": 13500 + }, + { + "epoch": 1.32, + "eval_cer": 0.06601251875848323, + "eval_loss": 0.27916088700294495, + "eval_runtime": 273.5283, + "eval_samples_per_second": 59.848, + "eval_steps_per_second": 1.663, + "eval_wer": 0.17279927910515008, + "step": 13500 + }, + { + "epoch": 1.32, + "learning_rate": 2.6996e-05, + "loss": 0.1497, + "step": 13505 + }, + { + "epoch": 1.32, + "learning_rate": 2.7006000000000002e-05, + "loss": 0.179, + "step": 13510 + }, + { + "epoch": 1.32, + "learning_rate": 2.7016e-05, + "loss": 0.1612, + "step": 13515 + }, + { + "epoch": 1.32, + "learning_rate": 2.7026000000000002e-05, + "loss": 0.1421, + "step": 13520 + }, + { + "epoch": 1.32, + "learning_rate": 2.7036e-05, + "loss": 0.1457, + "step": 13525 + }, + { + "epoch": 1.32, + "learning_rate": 2.7045999999999998e-05, + "loss": 0.1666, + "step": 13530 + }, + { + "epoch": 1.32, + "learning_rate": 2.7056000000000003e-05, + "loss": 0.1539, + "step": 13535 + }, + { + "epoch": 1.32, + "learning_rate": 2.7066e-05, + "loss": 0.1615, + "step": 13540 + }, + { + "epoch": 1.32, + "learning_rate": 2.7076e-05, + "loss": 0.1674, + "step": 13545 + }, + { + "epoch": 1.32, + "learning_rate": 2.7086e-05, + "loss": 0.1717, + "step": 13550 + }, + { + "epoch": 1.33, + "learning_rate": 2.7096e-05, + "loss": 0.1373, + "step": 13555 + }, + { + "epoch": 1.33, + "learning_rate": 2.7106e-05, + "loss": 0.1677, + "step": 13560 + }, + { + "epoch": 1.33, + "learning_rate": 2.7116000000000003e-05, + "loss": 0.1795, + "step": 13565 + }, + { + "epoch": 1.33, + "learning_rate": 2.7126e-05, + "loss": 0.1241, + "step": 13570 + }, + { + "epoch": 1.33, + "learning_rate": 2.7136e-05, + "loss": 0.1655, + "step": 13575 + }, + { + "epoch": 1.33, + "learning_rate": 2.7146e-05, + "loss": 0.1637, + "step": 13580 + }, + { + "epoch": 1.33, + "learning_rate": 2.7156000000000002e-05, + "loss": 0.1369, + "step": 13585 + }, + { + "epoch": 1.33, + "learning_rate": 2.7166e-05, + "loss": 0.1366, + "step": 13590 + }, + { + "epoch": 1.33, + "learning_rate": 2.7176000000000002e-05, + "loss": 0.1895, + "step": 13595 + }, + { + "epoch": 1.33, + "learning_rate": 2.7186e-05, + "loss": 0.1537, + "step": 13600 + }, + { + "epoch": 1.33, + "learning_rate": 2.7196e-05, + "loss": 0.1561, + "step": 13605 + }, + { + "epoch": 1.33, + "learning_rate": 2.7206000000000003e-05, + "loss": 0.1623, + "step": 13610 + }, + { + "epoch": 1.33, + "learning_rate": 2.7216e-05, + "loss": 0.1631, + "step": 13615 + }, + { + "epoch": 1.33, + "learning_rate": 2.7226e-05, + "loss": 0.1334, + "step": 13620 + }, + { + "epoch": 1.33, + "learning_rate": 2.7236e-05, + "loss": 0.1582, + "step": 13625 + }, + { + "epoch": 1.33, + "learning_rate": 2.7246e-05, + "loss": 0.1864, + "step": 13630 + }, + { + "epoch": 1.33, + "learning_rate": 2.7256e-05, + "loss": 0.1383, + "step": 13635 + }, + { + "epoch": 1.33, + "learning_rate": 2.7266000000000003e-05, + "loss": 0.1424, + "step": 13640 + }, + { + "epoch": 1.33, + "learning_rate": 2.7276e-05, + "loss": 0.1937, + "step": 13645 + }, + { + "epoch": 1.33, + "learning_rate": 2.7286e-05, + "loss": 0.1462, + "step": 13650 + }, + { + "epoch": 1.34, + "learning_rate": 2.7296e-05, + "loss": 0.1491, + "step": 13655 + }, + { + "epoch": 1.34, + "learning_rate": 2.7306000000000002e-05, + "loss": 0.1582, + "step": 13660 + }, + { + "epoch": 1.34, + "learning_rate": 2.7316e-05, + "loss": 0.1637, + "step": 13665 + }, + { + "epoch": 1.34, + "learning_rate": 2.7326000000000002e-05, + "loss": 0.1408, + "step": 13670 + }, + { + "epoch": 1.34, + "learning_rate": 2.7336e-05, + "loss": 0.1373, + "step": 13675 + }, + { + "epoch": 1.34, + "learning_rate": 2.7346e-05, + "loss": 0.1895, + "step": 13680 + }, + { + "epoch": 1.34, + "learning_rate": 2.7356000000000004e-05, + "loss": 0.1596, + "step": 13685 + }, + { + "epoch": 1.34, + "learning_rate": 2.7366000000000002e-05, + "loss": 0.1485, + "step": 13690 + }, + { + "epoch": 1.34, + "learning_rate": 2.7376e-05, + "loss": 0.191, + "step": 13695 + }, + { + "epoch": 1.34, + "learning_rate": 2.7386000000000002e-05, + "loss": 0.1676, + "step": 13700 + }, + { + "epoch": 1.34, + "learning_rate": 2.7396e-05, + "loss": 0.1547, + "step": 13705 + }, + { + "epoch": 1.34, + "learning_rate": 2.7406e-05, + "loss": 0.1755, + "step": 13710 + }, + { + "epoch": 1.34, + "learning_rate": 2.7416000000000003e-05, + "loss": 0.1549, + "step": 13715 + }, + { + "epoch": 1.34, + "learning_rate": 2.7426e-05, + "loss": 0.153, + "step": 13720 + }, + { + "epoch": 1.34, + "learning_rate": 2.7436e-05, + "loss": 0.1407, + "step": 13725 + }, + { + "epoch": 1.34, + "learning_rate": 2.7446e-05, + "loss": 0.1724, + "step": 13730 + }, + { + "epoch": 1.34, + "learning_rate": 2.7456000000000003e-05, + "loss": 0.1535, + "step": 13735 + }, + { + "epoch": 1.34, + "learning_rate": 2.7466e-05, + "loss": 0.1377, + "step": 13740 + }, + { + "epoch": 1.34, + "learning_rate": 2.7476000000000003e-05, + "loss": 0.1753, + "step": 13745 + }, + { + "epoch": 1.34, + "learning_rate": 2.7486e-05, + "loss": 0.1473, + "step": 13750 + }, + { + "epoch": 1.35, + "learning_rate": 2.7496e-05, + "loss": 0.1404, + "step": 13755 + }, + { + "epoch": 1.35, + "learning_rate": 2.7506e-05, + "loss": 0.1407, + "step": 13760 + }, + { + "epoch": 1.35, + "learning_rate": 2.7516000000000002e-05, + "loss": 0.1568, + "step": 13765 + }, + { + "epoch": 1.35, + "learning_rate": 2.7526e-05, + "loss": 0.141, + "step": 13770 + }, + { + "epoch": 1.35, + "learning_rate": 2.7536000000000002e-05, + "loss": 0.1356, + "step": 13775 + }, + { + "epoch": 1.35, + "learning_rate": 2.7546e-05, + "loss": 0.1964, + "step": 13780 + }, + { + "epoch": 1.35, + "learning_rate": 2.7556e-05, + "loss": 0.146, + "step": 13785 + }, + { + "epoch": 1.35, + "learning_rate": 2.7566000000000003e-05, + "loss": 0.1479, + "step": 13790 + }, + { + "epoch": 1.35, + "learning_rate": 2.7576e-05, + "loss": 0.1594, + "step": 13795 + }, + { + "epoch": 1.35, + "learning_rate": 2.7586e-05, + "loss": 0.164, + "step": 13800 + }, + { + "epoch": 1.35, + "learning_rate": 2.7596e-05, + "loss": 0.1504, + "step": 13805 + }, + { + "epoch": 1.35, + "learning_rate": 2.7606e-05, + "loss": 0.1597, + "step": 13810 + }, + { + "epoch": 1.35, + "learning_rate": 2.7616e-05, + "loss": 0.1608, + "step": 13815 + }, + { + "epoch": 1.35, + "learning_rate": 2.7626e-05, + "loss": 0.157, + "step": 13820 + }, + { + "epoch": 1.35, + "learning_rate": 2.7636e-05, + "loss": 0.1457, + "step": 13825 + }, + { + "epoch": 1.35, + "learning_rate": 2.7646e-05, + "loss": 0.1707, + "step": 13830 + }, + { + "epoch": 1.35, + "learning_rate": 2.7655999999999997e-05, + "loss": 0.1426, + "step": 13835 + }, + { + "epoch": 1.35, + "learning_rate": 2.7666000000000002e-05, + "loss": 0.1478, + "step": 13840 + }, + { + "epoch": 1.35, + "learning_rate": 2.7676e-05, + "loss": 0.1758, + "step": 13845 + }, + { + "epoch": 1.35, + "learning_rate": 2.7686e-05, + "loss": 0.1741, + "step": 13850 + }, + { + "epoch": 1.35, + "learning_rate": 2.7696e-05, + "loss": 0.1446, + "step": 13855 + }, + { + "epoch": 1.36, + "learning_rate": 2.7706e-05, + "loss": 0.1532, + "step": 13860 + }, + { + "epoch": 1.36, + "learning_rate": 2.7716e-05, + "loss": 0.175, + "step": 13865 + }, + { + "epoch": 1.36, + "learning_rate": 2.7726000000000002e-05, + "loss": 0.1493, + "step": 13870 + }, + { + "epoch": 1.36, + "learning_rate": 2.7736e-05, + "loss": 0.1627, + "step": 13875 + }, + { + "epoch": 1.36, + "learning_rate": 2.7745999999999998e-05, + "loss": 0.1669, + "step": 13880 + }, + { + "epoch": 1.36, + "learning_rate": 2.7756e-05, + "loss": 0.1291, + "step": 13885 + }, + { + "epoch": 1.36, + "learning_rate": 2.7766e-05, + "loss": 0.1323, + "step": 13890 + }, + { + "epoch": 1.36, + "learning_rate": 2.7776e-05, + "loss": 0.1765, + "step": 13895 + }, + { + "epoch": 1.36, + "learning_rate": 2.7786e-05, + "loss": 0.1504, + "step": 13900 + }, + { + "epoch": 1.36, + "learning_rate": 2.7796e-05, + "loss": 0.1517, + "step": 13905 + }, + { + "epoch": 1.36, + "learning_rate": 2.7805999999999998e-05, + "loss": 0.1622, + "step": 13910 + }, + { + "epoch": 1.36, + "learning_rate": 2.7816000000000003e-05, + "loss": 0.1689, + "step": 13915 + }, + { + "epoch": 1.36, + "learning_rate": 2.7826e-05, + "loss": 0.1567, + "step": 13920 + }, + { + "epoch": 1.36, + "learning_rate": 2.7836e-05, + "loss": 0.1489, + "step": 13925 + }, + { + "epoch": 1.36, + "learning_rate": 2.7846e-05, + "loss": 0.1745, + "step": 13930 + }, + { + "epoch": 1.36, + "learning_rate": 2.7856e-05, + "loss": 0.1377, + "step": 13935 + }, + { + "epoch": 1.36, + "learning_rate": 2.7866e-05, + "loss": 0.1374, + "step": 13940 + }, + { + "epoch": 1.36, + "learning_rate": 2.7876000000000002e-05, + "loss": 0.1665, + "step": 13945 + }, + { + "epoch": 1.36, + "learning_rate": 2.7886e-05, + "loss": 0.1397, + "step": 13950 + }, + { + "epoch": 1.36, + "learning_rate": 2.7896e-05, + "loss": 0.1435, + "step": 13955 + }, + { + "epoch": 1.37, + "learning_rate": 2.7906e-05, + "loss": 0.1951, + "step": 13960 + }, + { + "epoch": 1.37, + "learning_rate": 2.7916000000000002e-05, + "loss": 0.1633, + "step": 13965 + }, + { + "epoch": 1.37, + "learning_rate": 2.7926e-05, + "loss": 0.142, + "step": 13970 + }, + { + "epoch": 1.37, + "learning_rate": 2.7936e-05, + "loss": 0.1613, + "step": 13975 + }, + { + "epoch": 1.37, + "learning_rate": 2.7946e-05, + "loss": 0.2112, + "step": 13980 + }, + { + "epoch": 1.37, + "learning_rate": 2.7955999999999998e-05, + "loss": 0.15, + "step": 13985 + }, + { + "epoch": 1.37, + "learning_rate": 2.7966000000000003e-05, + "loss": 0.1686, + "step": 13990 + }, + { + "epoch": 1.37, + "learning_rate": 2.7976e-05, + "loss": 0.175, + "step": 13995 + }, + { + "epoch": 1.37, + "learning_rate": 2.7986e-05, + "loss": 0.1566, + "step": 14000 + }, + { + "epoch": 1.37, + "eval_cer": 0.06605182775261231, + "eval_loss": 0.2746506333351135, + "eval_runtime": 270.3795, + "eval_samples_per_second": 60.545, + "eval_steps_per_second": 1.683, + "eval_wer": 0.17023305015573678, + "step": 14000 + }, + { + "epoch": 1.37, + "learning_rate": 2.7996e-05, + "loss": 0.1439, + "step": 14005 + }, + { + "epoch": 1.37, + "learning_rate": 2.8006e-05, + "loss": 0.1585, + "step": 14010 + }, + { + "epoch": 1.37, + "learning_rate": 2.8016e-05, + "loss": 0.183, + "step": 14015 + }, + { + "epoch": 1.37, + "learning_rate": 2.8026000000000002e-05, + "loss": 0.1268, + "step": 14020 + }, + { + "epoch": 1.37, + "learning_rate": 2.8036e-05, + "loss": 0.141, + "step": 14025 + }, + { + "epoch": 1.37, + "learning_rate": 2.8046e-05, + "loss": 0.143, + "step": 14030 + }, + { + "epoch": 1.37, + "learning_rate": 2.8056e-05, + "loss": 0.1494, + "step": 14035 + }, + { + "epoch": 1.37, + "learning_rate": 2.8066000000000002e-05, + "loss": 0.1379, + "step": 14040 + }, + { + "epoch": 1.37, + "learning_rate": 2.8076e-05, + "loss": 0.1799, + "step": 14045 + }, + { + "epoch": 1.37, + "learning_rate": 2.8086000000000002e-05, + "loss": 0.14, + "step": 14050 + }, + { + "epoch": 1.37, + "learning_rate": 2.8096e-05, + "loss": 0.1406, + "step": 14055 + }, + { + "epoch": 1.37, + "learning_rate": 2.8105999999999998e-05, + "loss": 0.17, + "step": 14060 + }, + { + "epoch": 1.38, + "learning_rate": 2.8116000000000003e-05, + "loss": 0.1575, + "step": 14065 + }, + { + "epoch": 1.38, + "learning_rate": 2.8126e-05, + "loss": 0.1408, + "step": 14070 + }, + { + "epoch": 1.38, + "learning_rate": 2.8134e-05, + "loss": 0.1628, + "step": 14075 + }, + { + "epoch": 1.38, + "learning_rate": 2.8144000000000004e-05, + "loss": 0.1753, + "step": 14080 + }, + { + "epoch": 1.38, + "learning_rate": 2.8154000000000002e-05, + "loss": 0.1528, + "step": 14085 + }, + { + "epoch": 1.38, + "learning_rate": 2.8164e-05, + "loss": 0.1514, + "step": 14090 + }, + { + "epoch": 1.38, + "learning_rate": 2.8174e-05, + "loss": 0.1944, + "step": 14095 + }, + { + "epoch": 1.38, + "learning_rate": 2.8184e-05, + "loss": 0.1603, + "step": 14100 + }, + { + "epoch": 1.38, + "learning_rate": 2.8194e-05, + "loss": 0.1483, + "step": 14105 + }, + { + "epoch": 1.38, + "learning_rate": 2.8204000000000003e-05, + "loss": 0.151, + "step": 14110 + }, + { + "epoch": 1.38, + "learning_rate": 2.8214e-05, + "loss": 0.1525, + "step": 14115 + }, + { + "epoch": 1.38, + "learning_rate": 2.8224e-05, + "loss": 0.1614, + "step": 14120 + }, + { + "epoch": 1.38, + "learning_rate": 2.8234e-05, + "loss": 0.1439, + "step": 14125 + }, + { + "epoch": 1.38, + "learning_rate": 2.8244e-05, + "loss": 0.1891, + "step": 14130 + }, + { + "epoch": 1.38, + "learning_rate": 2.8254e-05, + "loss": 0.1429, + "step": 14135 + }, + { + "epoch": 1.38, + "learning_rate": 2.8264000000000002e-05, + "loss": 0.1643, + "step": 14140 + }, + { + "epoch": 1.38, + "learning_rate": 2.8274e-05, + "loss": 0.1616, + "step": 14145 + }, + { + "epoch": 1.38, + "learning_rate": 2.8284e-05, + "loss": 0.1509, + "step": 14150 + }, + { + "epoch": 1.38, + "learning_rate": 2.8294e-05, + "loss": 0.137, + "step": 14155 + }, + { + "epoch": 1.38, + "learning_rate": 2.8304000000000002e-05, + "loss": 0.1805, + "step": 14160 + }, + { + "epoch": 1.39, + "learning_rate": 2.8314e-05, + "loss": 0.1513, + "step": 14165 + }, + { + "epoch": 1.39, + "learning_rate": 2.8324000000000002e-05, + "loss": 0.138, + "step": 14170 + }, + { + "epoch": 1.39, + "learning_rate": 2.8334e-05, + "loss": 0.1674, + "step": 14175 + }, + { + "epoch": 1.39, + "learning_rate": 2.8344e-05, + "loss": 0.176, + "step": 14180 + }, + { + "epoch": 1.39, + "learning_rate": 2.8354000000000003e-05, + "loss": 0.1412, + "step": 14185 + }, + { + "epoch": 1.39, + "learning_rate": 2.8364e-05, + "loss": 0.1589, + "step": 14190 + }, + { + "epoch": 1.39, + "learning_rate": 2.8374e-05, + "loss": 0.1609, + "step": 14195 + }, + { + "epoch": 1.39, + "learning_rate": 2.8384e-05, + "loss": 0.1411, + "step": 14200 + }, + { + "epoch": 1.39, + "learning_rate": 2.8394e-05, + "loss": 0.1562, + "step": 14205 + }, + { + "epoch": 1.39, + "learning_rate": 2.8404e-05, + "loss": 0.155, + "step": 14210 + }, + { + "epoch": 1.39, + "learning_rate": 2.8414000000000003e-05, + "loss": 0.1598, + "step": 14215 + }, + { + "epoch": 1.39, + "learning_rate": 2.8424e-05, + "loss": 0.1348, + "step": 14220 + }, + { + "epoch": 1.39, + "learning_rate": 2.8434e-05, + "loss": 0.1442, + "step": 14225 + }, + { + "epoch": 1.39, + "learning_rate": 2.8444e-05, + "loss": 0.1753, + "step": 14230 + }, + { + "epoch": 1.39, + "learning_rate": 2.8454000000000002e-05, + "loss": 0.1411, + "step": 14235 + }, + { + "epoch": 1.39, + "learning_rate": 2.8464e-05, + "loss": 0.1522, + "step": 14240 + }, + { + "epoch": 1.39, + "learning_rate": 2.8474000000000002e-05, + "loss": 0.1693, + "step": 14245 + }, + { + "epoch": 1.39, + "learning_rate": 2.8484e-05, + "loss": 0.142, + "step": 14250 + }, + { + "epoch": 1.39, + "learning_rate": 2.8494e-05, + "loss": 0.1403, + "step": 14255 + }, + { + "epoch": 1.39, + "learning_rate": 2.8504000000000004e-05, + "loss": 0.1681, + "step": 14260 + }, + { + "epoch": 1.39, + "learning_rate": 2.8514000000000002e-05, + "loss": 0.1804, + "step": 14265 + }, + { + "epoch": 1.4, + "learning_rate": 2.8524e-05, + "loss": 0.141, + "step": 14270 + }, + { + "epoch": 1.4, + "learning_rate": 2.8534e-05, + "loss": 0.1363, + "step": 14275 + }, + { + "epoch": 1.4, + "learning_rate": 2.8544e-05, + "loss": 0.1861, + "step": 14280 + }, + { + "epoch": 1.4, + "learning_rate": 2.8554e-05, + "loss": 0.1589, + "step": 14285 + }, + { + "epoch": 1.4, + "learning_rate": 2.8564000000000003e-05, + "loss": 0.1576, + "step": 14290 + }, + { + "epoch": 1.4, + "learning_rate": 2.8574e-05, + "loss": 0.1605, + "step": 14295 + }, + { + "epoch": 1.4, + "learning_rate": 2.8584e-05, + "loss": 0.1626, + "step": 14300 + }, + { + "epoch": 1.4, + "learning_rate": 2.8594e-05, + "loss": 0.1424, + "step": 14305 + }, + { + "epoch": 1.4, + "learning_rate": 2.8604000000000003e-05, + "loss": 0.1502, + "step": 14310 + }, + { + "epoch": 1.4, + "learning_rate": 2.8614e-05, + "loss": 0.1741, + "step": 14315 + }, + { + "epoch": 1.4, + "learning_rate": 2.8624000000000002e-05, + "loss": 0.1412, + "step": 14320 + }, + { + "epoch": 1.4, + "learning_rate": 2.8634e-05, + "loss": 0.1581, + "step": 14325 + }, + { + "epoch": 1.4, + "learning_rate": 2.8644e-05, + "loss": 0.1888, + "step": 14330 + }, + { + "epoch": 1.4, + "learning_rate": 2.8654e-05, + "loss": 0.1658, + "step": 14335 + }, + { + "epoch": 1.4, + "learning_rate": 2.8664000000000002e-05, + "loss": 0.13, + "step": 14340 + }, + { + "epoch": 1.4, + "learning_rate": 2.8674e-05, + "loss": 0.1724, + "step": 14345 + }, + { + "epoch": 1.4, + "learning_rate": 2.8684e-05, + "loss": 0.1438, + "step": 14350 + }, + { + "epoch": 1.4, + "learning_rate": 2.8694e-05, + "loss": 0.1603, + "step": 14355 + }, + { + "epoch": 1.4, + "learning_rate": 2.8704e-05, + "loss": 0.1603, + "step": 14360 + }, + { + "epoch": 1.4, + "learning_rate": 2.8714e-05, + "loss": 0.1664, + "step": 14365 + }, + { + "epoch": 1.41, + "learning_rate": 2.8724e-05, + "loss": 0.1476, + "step": 14370 + }, + { + "epoch": 1.41, + "learning_rate": 2.8734e-05, + "loss": 0.1401, + "step": 14375 + }, + { + "epoch": 1.41, + "learning_rate": 2.8743999999999998e-05, + "loss": 0.1746, + "step": 14380 + }, + { + "epoch": 1.41, + "learning_rate": 2.8754000000000003e-05, + "loss": 0.1542, + "step": 14385 + }, + { + "epoch": 1.41, + "learning_rate": 2.8764e-05, + "loss": 0.1467, + "step": 14390 + }, + { + "epoch": 1.41, + "learning_rate": 2.8774e-05, + "loss": 0.1716, + "step": 14395 + }, + { + "epoch": 1.41, + "learning_rate": 2.8784e-05, + "loss": 0.1509, + "step": 14400 + }, + { + "epoch": 1.41, + "learning_rate": 2.8794e-05, + "loss": 0.1433, + "step": 14405 + }, + { + "epoch": 1.41, + "learning_rate": 2.8804e-05, + "loss": 0.1516, + "step": 14410 + }, + { + "epoch": 1.41, + "learning_rate": 2.8814000000000002e-05, + "loss": 0.161, + "step": 14415 + }, + { + "epoch": 1.41, + "learning_rate": 2.8824e-05, + "loss": 0.1332, + "step": 14420 + }, + { + "epoch": 1.41, + "learning_rate": 2.8834e-05, + "loss": 0.1467, + "step": 14425 + }, + { + "epoch": 1.41, + "learning_rate": 2.8844e-05, + "loss": 0.163, + "step": 14430 + }, + { + "epoch": 1.41, + "learning_rate": 2.8854000000000002e-05, + "loss": 0.1318, + "step": 14435 + }, + { + "epoch": 1.41, + "learning_rate": 2.8864e-05, + "loss": 0.1471, + "step": 14440 + }, + { + "epoch": 1.41, + "learning_rate": 2.8874000000000002e-05, + "loss": 0.1919, + "step": 14445 + }, + { + "epoch": 1.41, + "learning_rate": 2.8884e-05, + "loss": 0.1435, + "step": 14450 + }, + { + "epoch": 1.41, + "learning_rate": 2.8893999999999998e-05, + "loss": 0.1389, + "step": 14455 + }, + { + "epoch": 1.41, + "learning_rate": 2.8904000000000003e-05, + "loss": 0.1545, + "step": 14460 + }, + { + "epoch": 1.41, + "learning_rate": 2.8914e-05, + "loss": 0.1569, + "step": 14465 + }, + { + "epoch": 1.41, + "learning_rate": 2.8924e-05, + "loss": 0.1343, + "step": 14470 + }, + { + "epoch": 1.42, + "learning_rate": 2.8934e-05, + "loss": 0.1755, + "step": 14475 + }, + { + "epoch": 1.42, + "learning_rate": 2.8944e-05, + "loss": 0.1767, + "step": 14480 + }, + { + "epoch": 1.42, + "learning_rate": 2.8954e-05, + "loss": 0.1389, + "step": 14485 + }, + { + "epoch": 1.42, + "learning_rate": 2.8964000000000003e-05, + "loss": 0.1236, + "step": 14490 + }, + { + "epoch": 1.42, + "learning_rate": 2.8974e-05, + "loss": 0.1659, + "step": 14495 + }, + { + "epoch": 1.42, + "learning_rate": 2.8984e-05, + "loss": 0.1528, + "step": 14500 + }, + { + "epoch": 1.42, + "eval_cer": 0.06733283850246606, + "eval_loss": 0.27808916568756104, + "eval_runtime": 273.3925, + "eval_samples_per_second": 59.877, + "eval_steps_per_second": 1.664, + "eval_wer": 0.17540468712249335, + "step": 14500 + }, + { + "epoch": 1.42, + "learning_rate": 2.8994e-05, + "loss": 0.1396, + "step": 14505 + }, + { + "epoch": 1.42, + "learning_rate": 2.9004000000000002e-05, + "loss": 0.1703, + "step": 14510 + }, + { + "epoch": 1.42, + "learning_rate": 2.9014e-05, + "loss": 0.1696, + "step": 14515 + }, + { + "epoch": 1.42, + "learning_rate": 2.9024000000000002e-05, + "loss": 0.1456, + "step": 14520 + }, + { + "epoch": 1.42, + "learning_rate": 2.9034e-05, + "loss": 0.1375, + "step": 14525 + }, + { + "epoch": 1.42, + "learning_rate": 2.9044e-05, + "loss": 0.1742, + "step": 14530 + }, + { + "epoch": 1.42, + "learning_rate": 2.9054e-05, + "loss": 0.1489, + "step": 14535 + }, + { + "epoch": 1.42, + "learning_rate": 2.9064e-05, + "loss": 0.1421, + "step": 14540 + }, + { + "epoch": 1.42, + "learning_rate": 2.9074e-05, + "loss": 0.173, + "step": 14545 + }, + { + "epoch": 1.42, + "learning_rate": 2.9084e-05, + "loss": 0.1506, + "step": 14550 + }, + { + "epoch": 1.42, + "learning_rate": 2.9094e-05, + "loss": 0.1431, + "step": 14555 + }, + { + "epoch": 1.42, + "learning_rate": 2.9103999999999998e-05, + "loss": 0.1586, + "step": 14560 + }, + { + "epoch": 1.42, + "learning_rate": 2.9114000000000003e-05, + "loss": 0.1825, + "step": 14565 + }, + { + "epoch": 1.42, + "learning_rate": 2.9124e-05, + "loss": 0.131, + "step": 14570 + }, + { + "epoch": 1.43, + "learning_rate": 2.9134e-05, + "loss": 0.1515, + "step": 14575 + }, + { + "epoch": 1.43, + "learning_rate": 2.9144e-05, + "loss": 0.1654, + "step": 14580 + }, + { + "epoch": 1.43, + "learning_rate": 2.9154e-05, + "loss": 0.1481, + "step": 14585 + }, + { + "epoch": 1.43, + "learning_rate": 2.9164e-05, + "loss": 0.1399, + "step": 14590 + }, + { + "epoch": 1.43, + "learning_rate": 2.9174000000000002e-05, + "loss": 0.1867, + "step": 14595 + }, + { + "epoch": 1.43, + "learning_rate": 2.9184e-05, + "loss": 0.152, + "step": 14600 + }, + { + "epoch": 1.43, + "learning_rate": 2.9194e-05, + "loss": 0.1499, + "step": 14605 + }, + { + "epoch": 1.43, + "learning_rate": 2.9204e-05, + "loss": 0.156, + "step": 14610 + }, + { + "epoch": 1.43, + "learning_rate": 2.9214000000000002e-05, + "loss": 0.1916, + "step": 14615 + }, + { + "epoch": 1.43, + "learning_rate": 2.9224e-05, + "loss": 0.144, + "step": 14620 + }, + { + "epoch": 1.43, + "learning_rate": 2.9234e-05, + "loss": 0.1389, + "step": 14625 + }, + { + "epoch": 1.43, + "learning_rate": 2.9244e-05, + "loss": 0.1747, + "step": 14630 + }, + { + "epoch": 1.43, + "learning_rate": 2.9253999999999998e-05, + "loss": 0.1525, + "step": 14635 + }, + { + "epoch": 1.43, + "learning_rate": 2.9264000000000003e-05, + "loss": 0.1352, + "step": 14640 + }, + { + "epoch": 1.43, + "learning_rate": 2.9274e-05, + "loss": 0.1637, + "step": 14645 + }, + { + "epoch": 1.43, + "learning_rate": 2.9284e-05, + "loss": 0.1543, + "step": 14650 + }, + { + "epoch": 1.43, + "learning_rate": 2.9294e-05, + "loss": 0.1464, + "step": 14655 + }, + { + "epoch": 1.43, + "learning_rate": 2.9304e-05, + "loss": 0.153, + "step": 14660 + }, + { + "epoch": 1.43, + "learning_rate": 2.9314e-05, + "loss": 0.1607, + "step": 14665 + }, + { + "epoch": 1.43, + "learning_rate": 2.9324000000000002e-05, + "loss": 0.1547, + "step": 14670 + }, + { + "epoch": 1.43, + "learning_rate": 2.9334e-05, + "loss": 0.1307, + "step": 14675 + }, + { + "epoch": 1.44, + "learning_rate": 2.9344e-05, + "loss": 0.1829, + "step": 14680 + }, + { + "epoch": 1.44, + "learning_rate": 2.9354e-05, + "loss": 0.1475, + "step": 14685 + }, + { + "epoch": 1.44, + "learning_rate": 2.9364000000000002e-05, + "loss": 0.1521, + "step": 14690 + }, + { + "epoch": 1.44, + "learning_rate": 2.9374e-05, + "loss": 0.1816, + "step": 14695 + }, + { + "epoch": 1.44, + "learning_rate": 2.9384000000000002e-05, + "loss": 0.1651, + "step": 14700 + }, + { + "epoch": 1.44, + "learning_rate": 2.9394e-05, + "loss": 0.1325, + "step": 14705 + }, + { + "epoch": 1.44, + "learning_rate": 2.9404e-05, + "loss": 0.1618, + "step": 14710 + }, + { + "epoch": 1.44, + "learning_rate": 2.9414000000000003e-05, + "loss": 0.1855, + "step": 14715 + }, + { + "epoch": 1.44, + "learning_rate": 2.9424e-05, + "loss": 0.1466, + "step": 14720 + }, + { + "epoch": 1.44, + "learning_rate": 2.9434e-05, + "loss": 0.1346, + "step": 14725 + }, + { + "epoch": 1.44, + "learning_rate": 2.9444e-05, + "loss": 0.1704, + "step": 14730 + }, + { + "epoch": 1.44, + "learning_rate": 2.9454e-05, + "loss": 0.138, + "step": 14735 + }, + { + "epoch": 1.44, + "learning_rate": 2.9464e-05, + "loss": 0.1434, + "step": 14740 + }, + { + "epoch": 1.44, + "learning_rate": 2.9474000000000003e-05, + "loss": 0.1888, + "step": 14745 + }, + { + "epoch": 1.44, + "learning_rate": 2.9484e-05, + "loss": 0.1491, + "step": 14750 + }, + { + "epoch": 1.44, + "learning_rate": 2.9494e-05, + "loss": 0.1414, + "step": 14755 + }, + { + "epoch": 1.44, + "learning_rate": 2.9504e-05, + "loss": 0.1739, + "step": 14760 + }, + { + "epoch": 1.44, + "learning_rate": 2.9514000000000002e-05, + "loss": 0.1649, + "step": 14765 + }, + { + "epoch": 1.44, + "learning_rate": 2.9524e-05, + "loss": 0.1484, + "step": 14770 + }, + { + "epoch": 1.44, + "learning_rate": 2.9534000000000002e-05, + "loss": 0.151, + "step": 14775 + }, + { + "epoch": 1.45, + "learning_rate": 2.9544e-05, + "loss": 0.1807, + "step": 14780 + }, + { + "epoch": 1.45, + "learning_rate": 2.9554e-05, + "loss": 0.1534, + "step": 14785 + }, + { + "epoch": 1.45, + "learning_rate": 2.9564000000000004e-05, + "loss": 0.1562, + "step": 14790 + }, + { + "epoch": 1.45, + "learning_rate": 2.9574000000000002e-05, + "loss": 0.1796, + "step": 14795 + }, + { + "epoch": 1.45, + "learning_rate": 2.9584e-05, + "loss": 0.1499, + "step": 14800 + }, + { + "epoch": 1.45, + "learning_rate": 2.9594e-05, + "loss": 0.1391, + "step": 14805 + }, + { + "epoch": 1.45, + "learning_rate": 2.9604e-05, + "loss": 0.1459, + "step": 14810 + }, + { + "epoch": 1.45, + "learning_rate": 2.9614e-05, + "loss": 0.1435, + "step": 14815 + }, + { + "epoch": 1.45, + "learning_rate": 2.9624000000000003e-05, + "loss": 0.1531, + "step": 14820 + }, + { + "epoch": 1.45, + "learning_rate": 2.9634e-05, + "loss": 0.1513, + "step": 14825 + }, + { + "epoch": 1.45, + "learning_rate": 2.9644e-05, + "loss": 0.1868, + "step": 14830 + }, + { + "epoch": 1.45, + "learning_rate": 2.9654e-05, + "loss": 0.1649, + "step": 14835 + }, + { + "epoch": 1.45, + "learning_rate": 2.9664000000000003e-05, + "loss": 0.1323, + "step": 14840 + }, + { + "epoch": 1.45, + "learning_rate": 2.9674e-05, + "loss": 0.1756, + "step": 14845 + }, + { + "epoch": 1.45, + "learning_rate": 2.9684000000000002e-05, + "loss": 0.1422, + "step": 14850 + }, + { + "epoch": 1.45, + "learning_rate": 2.9694e-05, + "loss": 0.1646, + "step": 14855 + }, + { + "epoch": 1.45, + "learning_rate": 2.9704e-05, + "loss": 0.1812, + "step": 14860 + }, + { + "epoch": 1.45, + "learning_rate": 2.9714000000000004e-05, + "loss": 0.1678, + "step": 14865 + }, + { + "epoch": 1.45, + "learning_rate": 2.9724000000000002e-05, + "loss": 0.1511, + "step": 14870 + }, + { + "epoch": 1.45, + "learning_rate": 2.9734e-05, + "loss": 0.1389, + "step": 14875 + }, + { + "epoch": 1.46, + "learning_rate": 2.9744000000000002e-05, + "loss": 0.1858, + "step": 14880 + }, + { + "epoch": 1.46, + "learning_rate": 2.9754e-05, + "loss": 0.1601, + "step": 14885 + }, + { + "epoch": 1.46, + "learning_rate": 2.9764e-05, + "loss": 0.134, + "step": 14890 + }, + { + "epoch": 1.46, + "learning_rate": 2.9774000000000003e-05, + "loss": 0.1932, + "step": 14895 + }, + { + "epoch": 1.46, + "learning_rate": 2.9784e-05, + "loss": 0.1445, + "step": 14900 + }, + { + "epoch": 1.46, + "learning_rate": 2.9794e-05, + "loss": 0.1426, + "step": 14905 + }, + { + "epoch": 1.46, + "learning_rate": 2.9804e-05, + "loss": 0.1724, + "step": 14910 + }, + { + "epoch": 1.46, + "learning_rate": 2.9814000000000003e-05, + "loss": 0.1879, + "step": 14915 + }, + { + "epoch": 1.46, + "learning_rate": 2.9824e-05, + "loss": 0.1326, + "step": 14920 + }, + { + "epoch": 1.46, + "learning_rate": 2.9834000000000003e-05, + "loss": 0.1642, + "step": 14925 + }, + { + "epoch": 1.46, + "learning_rate": 2.9844e-05, + "loss": 0.1976, + "step": 14930 + }, + { + "epoch": 1.46, + "learning_rate": 2.9854e-05, + "loss": 0.1401, + "step": 14935 + }, + { + "epoch": 1.46, + "learning_rate": 2.9864000000000004e-05, + "loss": 0.1401, + "step": 14940 + }, + { + "epoch": 1.46, + "learning_rate": 2.9874000000000002e-05, + "loss": 0.1857, + "step": 14945 + }, + { + "epoch": 1.46, + "learning_rate": 2.9884e-05, + "loss": 0.1623, + "step": 14950 + }, + { + "epoch": 1.46, + "learning_rate": 2.9894e-05, + "loss": 0.1315, + "step": 14955 + }, + { + "epoch": 1.46, + "learning_rate": 2.9904e-05, + "loss": 0.1657, + "step": 14960 + }, + { + "epoch": 1.46, + "learning_rate": 2.9914000000000002e-05, + "loss": 0.153, + "step": 14965 + }, + { + "epoch": 1.46, + "learning_rate": 2.9924e-05, + "loss": 0.1583, + "step": 14970 + }, + { + "epoch": 1.46, + "learning_rate": 2.9934000000000002e-05, + "loss": 0.1567, + "step": 14975 + }, + { + "epoch": 1.46, + "learning_rate": 2.9944e-05, + "loss": 0.1722, + "step": 14980 + }, + { + "epoch": 1.47, + "learning_rate": 2.9953999999999998e-05, + "loss": 0.1458, + "step": 14985 + }, + { + "epoch": 1.47, + "learning_rate": 2.9964e-05, + "loss": 0.156, + "step": 14990 + }, + { + "epoch": 1.47, + "learning_rate": 2.9974e-05, + "loss": 0.191, + "step": 14995 + }, + { + "epoch": 1.47, + "learning_rate": 2.9984e-05, + "loss": 0.153, + "step": 15000 + }, + { + "epoch": 1.47, + "eval_cer": 0.06922082636754834, + "eval_loss": 0.28999707102775574, + "eval_runtime": 272.2934, + "eval_samples_per_second": 60.119, + "eval_steps_per_second": 1.671, + "eval_wer": 0.1788002063430911, + "step": 15000 + }, + { + "epoch": 1.47, + "learning_rate": 2.9994e-05, + "loss": 0.1452, + "step": 15005 + }, + { + "epoch": 1.47, + "learning_rate": 2.9998339330196513e-05, + "loss": 0.175, + "step": 15010 + }, + { + "epoch": 1.47, + "learning_rate": 2.9994187655687794e-05, + "loss": 0.164, + "step": 15015 + }, + { + "epoch": 1.47, + "learning_rate": 2.9990035981179075e-05, + "loss": 0.1493, + "step": 15020 + }, + { + "epoch": 1.47, + "learning_rate": 2.998588430667036e-05, + "loss": 0.1389, + "step": 15025 + }, + { + "epoch": 1.47, + "learning_rate": 2.998173263216164e-05, + "loss": 0.1974, + "step": 15030 + }, + { + "epoch": 1.47, + "learning_rate": 2.997758095765292e-05, + "loss": 0.1495, + "step": 15035 + }, + { + "epoch": 1.47, + "learning_rate": 2.99734292831442e-05, + "loss": 0.1297, + "step": 15040 + }, + { + "epoch": 1.47, + "learning_rate": 2.9969277608635485e-05, + "loss": 0.1576, + "step": 15045 + }, + { + "epoch": 1.47, + "learning_rate": 2.9965125934126766e-05, + "loss": 0.1477, + "step": 15050 + }, + { + "epoch": 1.47, + "learning_rate": 2.9960974259618047e-05, + "loss": 0.1238, + "step": 15055 + }, + { + "epoch": 1.47, + "learning_rate": 2.9956822585109328e-05, + "loss": 0.157, + "step": 15060 + }, + { + "epoch": 1.47, + "learning_rate": 2.9952670910600608e-05, + "loss": 0.1651, + "step": 15065 + }, + { + "epoch": 1.47, + "learning_rate": 2.9948519236091892e-05, + "loss": 0.141, + "step": 15070 + }, + { + "epoch": 1.47, + "learning_rate": 2.9944367561583173e-05, + "loss": 0.1567, + "step": 15075 + }, + { + "epoch": 1.47, + "learning_rate": 2.9940215887074454e-05, + "loss": 0.1597, + "step": 15080 + }, + { + "epoch": 1.48, + "learning_rate": 2.9936064212565735e-05, + "loss": 0.1598, + "step": 15085 + }, + { + "epoch": 1.48, + "learning_rate": 2.9931912538057016e-05, + "loss": 0.1344, + "step": 15090 + }, + { + "epoch": 1.48, + "learning_rate": 2.99277608635483e-05, + "loss": 0.1807, + "step": 15095 + }, + { + "epoch": 1.48, + "learning_rate": 2.992360918903958e-05, + "loss": 0.1618, + "step": 15100 + }, + { + "epoch": 1.48, + "learning_rate": 2.991945751453086e-05, + "loss": 0.1483, + "step": 15105 + }, + { + "epoch": 1.48, + "learning_rate": 2.9915305840022145e-05, + "loss": 0.1552, + "step": 15110 + }, + { + "epoch": 1.48, + "learning_rate": 2.9911154165513426e-05, + "loss": 0.166, + "step": 15115 + }, + { + "epoch": 1.48, + "learning_rate": 2.9907002491004707e-05, + "loss": 0.1486, + "step": 15120 + }, + { + "epoch": 1.48, + "learning_rate": 2.9902850816495988e-05, + "loss": 0.1467, + "step": 15125 + }, + { + "epoch": 1.48, + "learning_rate": 2.989869914198727e-05, + "loss": 0.1759, + "step": 15130 + }, + { + "epoch": 1.48, + "learning_rate": 2.989454746747855e-05, + "loss": 0.1413, + "step": 15135 + }, + { + "epoch": 1.48, + "learning_rate": 2.989039579296983e-05, + "loss": 0.1407, + "step": 15140 + }, + { + "epoch": 1.48, + "learning_rate": 2.988624411846111e-05, + "loss": 0.1856, + "step": 15145 + }, + { + "epoch": 1.48, + "learning_rate": 2.9882092443952395e-05, + "loss": 0.1257, + "step": 15150 + }, + { + "epoch": 1.48, + "learning_rate": 2.987794076944368e-05, + "loss": 0.1603, + "step": 15155 + }, + { + "epoch": 1.48, + "learning_rate": 2.987378909493496e-05, + "loss": 0.1443, + "step": 15160 + }, + { + "epoch": 1.48, + "learning_rate": 2.986963742042624e-05, + "loss": 0.1831, + "step": 15165 + }, + { + "epoch": 1.48, + "learning_rate": 2.986548574591752e-05, + "loss": 0.148, + "step": 15170 + }, + { + "epoch": 1.48, + "learning_rate": 2.9861334071408802e-05, + "loss": 0.1578, + "step": 15175 + }, + { + "epoch": 1.48, + "learning_rate": 2.9857182396900083e-05, + "loss": 0.1846, + "step": 15180 + }, + { + "epoch": 1.48, + "learning_rate": 2.9853030722391364e-05, + "loss": 0.1588, + "step": 15185 + }, + { + "epoch": 1.49, + "learning_rate": 2.9848879047882644e-05, + "loss": 0.1416, + "step": 15190 + }, + { + "epoch": 1.49, + "learning_rate": 2.9844727373373925e-05, + "loss": 0.1956, + "step": 15195 + }, + { + "epoch": 1.49, + "learning_rate": 2.9840575698865213e-05, + "loss": 0.1619, + "step": 15200 + }, + { + "epoch": 1.49, + "learning_rate": 2.9836424024356494e-05, + "loss": 0.1523, + "step": 15205 + }, + { + "epoch": 1.49, + "learning_rate": 2.9832272349847774e-05, + "loss": 0.1521, + "step": 15210 + }, + { + "epoch": 1.49, + "learning_rate": 2.9828120675339055e-05, + "loss": 0.1636, + "step": 15215 + }, + { + "epoch": 1.49, + "learning_rate": 2.9823969000830336e-05, + "loss": 0.1431, + "step": 15220 + }, + { + "epoch": 1.49, + "learning_rate": 2.9819817326321617e-05, + "loss": 0.1511, + "step": 15225 + }, + { + "epoch": 1.49, + "learning_rate": 2.9815665651812897e-05, + "loss": 0.1715, + "step": 15230 + }, + { + "epoch": 1.49, + "learning_rate": 2.9811513977304178e-05, + "loss": 0.146, + "step": 15235 + }, + { + "epoch": 1.49, + "learning_rate": 2.980736230279546e-05, + "loss": 0.1498, + "step": 15240 + }, + { + "epoch": 1.49, + "learning_rate": 2.9803210628286743e-05, + "loss": 0.1747, + "step": 15245 + }, + { + "epoch": 1.49, + "learning_rate": 2.9799058953778027e-05, + "loss": 0.1438, + "step": 15250 + }, + { + "epoch": 1.49, + "learning_rate": 2.9794907279269308e-05, + "loss": 0.1324, + "step": 15255 + }, + { + "epoch": 1.49, + "learning_rate": 2.979075560476059e-05, + "loss": 0.1686, + "step": 15260 + }, + { + "epoch": 1.49, + "learning_rate": 2.978660393025187e-05, + "loss": 0.16, + "step": 15265 + }, + { + "epoch": 1.49, + "learning_rate": 2.978245225574315e-05, + "loss": 0.1511, + "step": 15270 + }, + { + "epoch": 1.49, + "learning_rate": 2.977830058123443e-05, + "loss": 0.1375, + "step": 15275 + }, + { + "epoch": 1.49, + "learning_rate": 2.9774148906725712e-05, + "loss": 0.1872, + "step": 15280 + }, + { + "epoch": 1.49, + "learning_rate": 2.9769997232216993e-05, + "loss": 0.1422, + "step": 15285 + }, + { + "epoch": 1.5, + "learning_rate": 2.9765845557708277e-05, + "loss": 0.1385, + "step": 15290 + }, + { + "epoch": 1.5, + "learning_rate": 2.9761693883199558e-05, + "loss": 0.1528, + "step": 15295 + }, + { + "epoch": 1.5, + "learning_rate": 2.9757542208690838e-05, + "loss": 0.1469, + "step": 15300 + }, + { + "epoch": 1.5, + "learning_rate": 2.9753390534182122e-05, + "loss": 0.1474, + "step": 15305 + }, + { + "epoch": 1.5, + "learning_rate": 2.9749238859673403e-05, + "loss": 0.1435, + "step": 15310 + }, + { + "epoch": 1.5, + "learning_rate": 2.9745087185164684e-05, + "loss": 0.1697, + "step": 15315 + }, + { + "epoch": 1.5, + "learning_rate": 2.9740935510655965e-05, + "loss": 0.1479, + "step": 15320 + }, + { + "epoch": 1.5, + "learning_rate": 2.9736783836147246e-05, + "loss": 0.1394, + "step": 15325 + }, + { + "epoch": 1.5, + "learning_rate": 2.973263216163853e-05, + "loss": 0.1673, + "step": 15330 + }, + { + "epoch": 1.5, + "learning_rate": 2.972848048712981e-05, + "loss": 0.1555, + "step": 15335 + }, + { + "epoch": 1.5, + "learning_rate": 2.972432881262109e-05, + "loss": 0.1361, + "step": 15340 + }, + { + "epoch": 1.5, + "learning_rate": 2.9720177138112372e-05, + "loss": 0.166, + "step": 15345 + }, + { + "epoch": 1.5, + "learning_rate": 2.9716025463603653e-05, + "loss": 0.1685, + "step": 15350 + }, + { + "epoch": 1.5, + "learning_rate": 2.9711873789094937e-05, + "loss": 0.1549, + "step": 15355 + }, + { + "epoch": 1.5, + "learning_rate": 2.9707722114586218e-05, + "loss": 0.1594, + "step": 15360 + }, + { + "epoch": 1.5, + "learning_rate": 2.97035704400775e-05, + "loss": 0.1658, + "step": 15365 + }, + { + "epoch": 1.5, + "learning_rate": 2.969941876556878e-05, + "loss": 0.1409, + "step": 15370 + }, + { + "epoch": 1.5, + "learning_rate": 2.9695267091060063e-05, + "loss": 0.1527, + "step": 15375 + }, + { + "epoch": 1.5, + "learning_rate": 2.9691115416551344e-05, + "loss": 0.1852, + "step": 15380 + }, + { + "epoch": 1.5, + "learning_rate": 2.9686963742042625e-05, + "loss": 0.1414, + "step": 15385 + }, + { + "epoch": 1.5, + "learning_rate": 2.9682812067533906e-05, + "loss": 0.1485, + "step": 15390 + }, + { + "epoch": 1.51, + "learning_rate": 2.9678660393025186e-05, + "loss": 0.1679, + "step": 15395 + }, + { + "epoch": 1.51, + "learning_rate": 2.9674508718516467e-05, + "loss": 0.162, + "step": 15400 + }, + { + "epoch": 1.51, + "learning_rate": 2.967035704400775e-05, + "loss": 0.149, + "step": 15405 + }, + { + "epoch": 1.51, + "learning_rate": 2.9666205369499032e-05, + "loss": 0.1605, + "step": 15410 + }, + { + "epoch": 1.51, + "learning_rate": 2.9662053694990313e-05, + "loss": 0.1565, + "step": 15415 + }, + { + "epoch": 1.51, + "learning_rate": 2.9657902020481597e-05, + "loss": 0.1441, + "step": 15420 + }, + { + "epoch": 1.51, + "learning_rate": 2.9653750345972878e-05, + "loss": 0.1807, + "step": 15425 + }, + { + "epoch": 1.51, + "learning_rate": 2.964959867146416e-05, + "loss": 0.1919, + "step": 15430 + }, + { + "epoch": 1.51, + "learning_rate": 2.964544699695544e-05, + "loss": 0.1477, + "step": 15435 + }, + { + "epoch": 1.51, + "learning_rate": 2.964129532244672e-05, + "loss": 0.1534, + "step": 15440 + }, + { + "epoch": 1.51, + "learning_rate": 2.9637143647938e-05, + "loss": 0.1544, + "step": 15445 + }, + { + "epoch": 1.51, + "learning_rate": 2.963299197342928e-05, + "loss": 0.1537, + "step": 15450 + }, + { + "epoch": 1.51, + "learning_rate": 2.9628840298920566e-05, + "loss": 0.1762, + "step": 15455 + }, + { + "epoch": 1.51, + "learning_rate": 2.9624688624411847e-05, + "loss": 0.1652, + "step": 15460 + }, + { + "epoch": 1.51, + "learning_rate": 2.962053694990313e-05, + "loss": 0.1594, + "step": 15465 + }, + { + "epoch": 1.51, + "learning_rate": 2.961638527539441e-05, + "loss": 0.1481, + "step": 15470 + }, + { + "epoch": 1.51, + "learning_rate": 2.9612233600885692e-05, + "loss": 0.1454, + "step": 15475 + }, + { + "epoch": 1.51, + "learning_rate": 2.9608081926376973e-05, + "loss": 0.1715, + "step": 15480 + }, + { + "epoch": 1.51, + "learning_rate": 2.9603930251868254e-05, + "loss": 0.1441, + "step": 15485 + }, + { + "epoch": 1.51, + "learning_rate": 2.9599778577359535e-05, + "loss": 0.1399, + "step": 15490 + }, + { + "epoch": 1.52, + "learning_rate": 2.9595626902850815e-05, + "loss": 0.1594, + "step": 15495 + }, + { + "epoch": 1.52, + "learning_rate": 2.9591475228342096e-05, + "loss": 0.1575, + "step": 15500 + }, + { + "epoch": 1.52, + "eval_cer": 0.06704611407470096, + "eval_loss": 0.2713145911693573, + "eval_runtime": 275.3189, + "eval_samples_per_second": 59.458, + "eval_steps_per_second": 1.653, + "eval_wer": 0.1757638285785181, + "step": 15500 + }, + { + "epoch": 1.52, + "learning_rate": 2.958732355383338e-05, + "loss": 0.1305, + "step": 15505 + }, + { + "epoch": 1.52, + "learning_rate": 2.9583171879324664e-05, + "loss": 0.1535, + "step": 15510 + }, + { + "epoch": 1.52, + "learning_rate": 2.9579020204815945e-05, + "loss": 0.1568, + "step": 15515 + }, + { + "epoch": 1.52, + "learning_rate": 2.9574868530307226e-05, + "loss": 0.1486, + "step": 15520 + }, + { + "epoch": 1.52, + "learning_rate": 2.9570716855798507e-05, + "loss": 0.145, + "step": 15525 + }, + { + "epoch": 1.52, + "learning_rate": 2.9566565181289788e-05, + "loss": 0.153, + "step": 15530 + }, + { + "epoch": 1.52, + "learning_rate": 2.9562413506781068e-05, + "loss": 0.1376, + "step": 15535 + }, + { + "epoch": 1.52, + "learning_rate": 2.955826183227235e-05, + "loss": 0.1385, + "step": 15540 + }, + { + "epoch": 1.52, + "learning_rate": 2.955411015776363e-05, + "loss": 0.1844, + "step": 15545 + }, + { + "epoch": 1.52, + "learning_rate": 2.9549958483254914e-05, + "loss": 0.159, + "step": 15550 + }, + { + "epoch": 1.52, + "learning_rate": 2.9545806808746195e-05, + "loss": 0.1428, + "step": 15555 + }, + { + "epoch": 1.52, + "learning_rate": 2.954165513423748e-05, + "loss": 0.1478, + "step": 15560 + }, + { + "epoch": 1.52, + "learning_rate": 2.953750345972876e-05, + "loss": 0.1684, + "step": 15565 + }, + { + "epoch": 1.52, + "learning_rate": 2.953335178522004e-05, + "loss": 0.1319, + "step": 15570 + }, + { + "epoch": 1.52, + "learning_rate": 2.952920011071132e-05, + "loss": 0.1571, + "step": 15575 + }, + { + "epoch": 1.52, + "learning_rate": 2.9525048436202602e-05, + "loss": 0.1598, + "step": 15580 + }, + { + "epoch": 1.52, + "learning_rate": 2.9520896761693883e-05, + "loss": 0.1521, + "step": 15585 + }, + { + "epoch": 1.52, + "learning_rate": 2.9516745087185164e-05, + "loss": 0.1465, + "step": 15590 + }, + { + "epoch": 1.52, + "learning_rate": 2.9512593412676448e-05, + "loss": 0.1774, + "step": 15595 + }, + { + "epoch": 1.53, + "learning_rate": 2.950844173816773e-05, + "loss": 0.1397, + "step": 15600 + }, + { + "epoch": 1.53, + "learning_rate": 2.950429006365901e-05, + "loss": 0.1552, + "step": 15605 + }, + { + "epoch": 1.53, + "learning_rate": 2.9500138389150293e-05, + "loss": 0.1801, + "step": 15610 + }, + { + "epoch": 1.53, + "learning_rate": 2.9495986714641574e-05, + "loss": 0.1515, + "step": 15615 + }, + { + "epoch": 1.53, + "learning_rate": 2.9491835040132855e-05, + "loss": 0.1284, + "step": 15620 + }, + { + "epoch": 1.53, + "learning_rate": 2.9487683365624136e-05, + "loss": 0.1306, + "step": 15625 + }, + { + "epoch": 1.53, + "learning_rate": 2.9483531691115416e-05, + "loss": 0.1648, + "step": 15630 + }, + { + "epoch": 1.53, + "learning_rate": 2.9479380016606697e-05, + "loss": 0.1287, + "step": 15635 + }, + { + "epoch": 1.53, + "learning_rate": 2.947522834209798e-05, + "loss": 0.1459, + "step": 15640 + }, + { + "epoch": 1.53, + "learning_rate": 2.9471076667589262e-05, + "loss": 0.1612, + "step": 15645 + }, + { + "epoch": 1.53, + "learning_rate": 2.9466924993080543e-05, + "loss": 0.1334, + "step": 15650 + }, + { + "epoch": 1.53, + "learning_rate": 2.9462773318571824e-05, + "loss": 0.138, + "step": 15655 + }, + { + "epoch": 1.53, + "learning_rate": 2.9458621644063108e-05, + "loss": 0.1802, + "step": 15660 + }, + { + "epoch": 1.53, + "learning_rate": 2.945446996955439e-05, + "loss": 0.1666, + "step": 15665 + }, + { + "epoch": 1.53, + "learning_rate": 2.945031829504567e-05, + "loss": 0.1407, + "step": 15670 + }, + { + "epoch": 1.53, + "learning_rate": 2.944616662053695e-05, + "loss": 0.1402, + "step": 15675 + }, + { + "epoch": 1.53, + "learning_rate": 2.944201494602823e-05, + "loss": 0.1872, + "step": 15680 + }, + { + "epoch": 1.53, + "learning_rate": 2.9437863271519515e-05, + "loss": 0.1489, + "step": 15685 + }, + { + "epoch": 1.53, + "learning_rate": 2.9433711597010796e-05, + "loss": 0.1587, + "step": 15690 + }, + { + "epoch": 1.53, + "learning_rate": 2.9429559922502077e-05, + "loss": 0.1618, + "step": 15695 + }, + { + "epoch": 1.54, + "learning_rate": 2.9425408247993357e-05, + "loss": 0.1359, + "step": 15700 + }, + { + "epoch": 1.54, + "learning_rate": 2.9421256573484638e-05, + "loss": 0.1301, + "step": 15705 + }, + { + "epoch": 1.54, + "learning_rate": 2.9417104898975922e-05, + "loss": 0.1309, + "step": 15710 + }, + { + "epoch": 1.54, + "learning_rate": 2.9412953224467203e-05, + "loss": 0.1611, + "step": 15715 + }, + { + "epoch": 1.54, + "learning_rate": 2.9408801549958484e-05, + "loss": 0.147, + "step": 15720 + }, + { + "epoch": 1.54, + "learning_rate": 2.9404649875449765e-05, + "loss": 0.1471, + "step": 15725 + }, + { + "epoch": 1.54, + "learning_rate": 2.940049820094105e-05, + "loss": 0.1856, + "step": 15730 + }, + { + "epoch": 1.54, + "learning_rate": 2.939634652643233e-05, + "loss": 0.1308, + "step": 15735 + }, + { + "epoch": 1.54, + "learning_rate": 2.939219485192361e-05, + "loss": 0.1472, + "step": 15740 + }, + { + "epoch": 1.54, + "learning_rate": 2.938804317741489e-05, + "loss": 0.1534, + "step": 15745 + }, + { + "epoch": 1.54, + "learning_rate": 2.9383891502906172e-05, + "loss": 0.1583, + "step": 15750 + }, + { + "epoch": 1.54, + "learning_rate": 2.9379739828397453e-05, + "loss": 0.1408, + "step": 15755 + }, + { + "epoch": 1.54, + "learning_rate": 2.9375588153888733e-05, + "loss": 0.1483, + "step": 15760 + }, + { + "epoch": 1.54, + "learning_rate": 2.9371436479380018e-05, + "loss": 0.1613, + "step": 15765 + }, + { + "epoch": 1.54, + "learning_rate": 2.9367284804871298e-05, + "loss": 0.1777, + "step": 15770 + }, + { + "epoch": 1.54, + "learning_rate": 2.9363133130362582e-05, + "loss": 0.1905, + "step": 15775 + }, + { + "epoch": 1.54, + "learning_rate": 2.9358981455853863e-05, + "loss": 0.1666, + "step": 15780 + }, + { + "epoch": 1.54, + "learning_rate": 2.9354829781345144e-05, + "loss": 0.1406, + "step": 15785 + }, + { + "epoch": 1.54, + "learning_rate": 2.9350678106836425e-05, + "loss": 0.1367, + "step": 15790 + }, + { + "epoch": 1.54, + "learning_rate": 2.9346526432327706e-05, + "loss": 0.1922, + "step": 15795 + }, + { + "epoch": 1.54, + "learning_rate": 2.9342374757818986e-05, + "loss": 0.1534, + "step": 15800 + }, + { + "epoch": 1.55, + "learning_rate": 2.9338223083310267e-05, + "loss": 0.1404, + "step": 15805 + }, + { + "epoch": 1.55, + "learning_rate": 2.9334071408801548e-05, + "loss": 0.1806, + "step": 15810 + }, + { + "epoch": 1.55, + "learning_rate": 2.9329919734292835e-05, + "loss": 0.172, + "step": 15815 + }, + { + "epoch": 1.55, + "learning_rate": 2.9325768059784116e-05, + "loss": 0.1579, + "step": 15820 + }, + { + "epoch": 1.55, + "learning_rate": 2.9321616385275397e-05, + "loss": 0.1533, + "step": 15825 + }, + { + "epoch": 1.55, + "learning_rate": 2.9317464710766678e-05, + "loss": 0.1797, + "step": 15830 + }, + { + "epoch": 1.55, + "learning_rate": 2.931331303625796e-05, + "loss": 0.1347, + "step": 15835 + }, + { + "epoch": 1.55, + "learning_rate": 2.930916136174924e-05, + "loss": 0.1399, + "step": 15840 + }, + { + "epoch": 1.55, + "learning_rate": 2.930500968724052e-05, + "loss": 0.1717, + "step": 15845 + }, + { + "epoch": 1.55, + "learning_rate": 2.93008580127318e-05, + "loss": 0.1461, + "step": 15850 + }, + { + "epoch": 1.55, + "learning_rate": 2.929670633822308e-05, + "loss": 0.134, + "step": 15855 + }, + { + "epoch": 1.55, + "learning_rate": 2.9292554663714366e-05, + "loss": 0.1533, + "step": 15860 + }, + { + "epoch": 1.55, + "learning_rate": 2.928840298920565e-05, + "loss": 0.1812, + "step": 15865 + }, + { + "epoch": 1.55, + "learning_rate": 2.928425131469693e-05, + "loss": 0.1413, + "step": 15870 + }, + { + "epoch": 1.55, + "learning_rate": 2.928009964018821e-05, + "loss": 0.1568, + "step": 15875 + }, + { + "epoch": 1.55, + "learning_rate": 2.9275947965679492e-05, + "loss": 0.2033, + "step": 15880 + }, + { + "epoch": 1.55, + "learning_rate": 2.9271796291170773e-05, + "loss": 0.1375, + "step": 15885 + }, + { + "epoch": 1.55, + "learning_rate": 2.9267644616662054e-05, + "loss": 0.1392, + "step": 15890 + }, + { + "epoch": 1.55, + "learning_rate": 2.9263492942153334e-05, + "loss": 0.1879, + "step": 15895 + }, + { + "epoch": 1.55, + "learning_rate": 2.9259341267644615e-05, + "loss": 0.1499, + "step": 15900 + }, + { + "epoch": 1.56, + "learning_rate": 2.92551895931359e-05, + "loss": 0.1379, + "step": 15905 + }, + { + "epoch": 1.56, + "learning_rate": 2.925103791862718e-05, + "loss": 0.1553, + "step": 15910 + }, + { + "epoch": 1.56, + "learning_rate": 2.924688624411846e-05, + "loss": 0.1732, + "step": 15915 + }, + { + "epoch": 1.56, + "learning_rate": 2.9242734569609745e-05, + "loss": 0.1367, + "step": 15920 + }, + { + "epoch": 1.56, + "learning_rate": 2.9238582895101026e-05, + "loss": 0.1336, + "step": 15925 + }, + { + "epoch": 1.56, + "learning_rate": 2.9234431220592307e-05, + "loss": 0.1682, + "step": 15930 + }, + { + "epoch": 1.56, + "learning_rate": 2.9230279546083587e-05, + "loss": 0.1524, + "step": 15935 + }, + { + "epoch": 1.56, + "learning_rate": 2.9226127871574868e-05, + "loss": 0.1457, + "step": 15940 + }, + { + "epoch": 1.56, + "learning_rate": 2.922197619706615e-05, + "loss": 0.1722, + "step": 15945 + }, + { + "epoch": 1.56, + "learning_rate": 2.9217824522557433e-05, + "loss": 0.1376, + "step": 15950 + }, + { + "epoch": 1.56, + "learning_rate": 2.9213672848048714e-05, + "loss": 0.1363, + "step": 15955 + }, + { + "epoch": 1.56, + "learning_rate": 2.9209521173539995e-05, + "loss": 0.1572, + "step": 15960 + }, + { + "epoch": 1.56, + "learning_rate": 2.9205369499031275e-05, + "loss": 0.1541, + "step": 15965 + }, + { + "epoch": 1.56, + "learning_rate": 2.920121782452256e-05, + "loss": 0.1476, + "step": 15970 + }, + { + "epoch": 1.56, + "learning_rate": 2.919706615001384e-05, + "loss": 0.1544, + "step": 15975 + }, + { + "epoch": 1.56, + "learning_rate": 2.919291447550512e-05, + "loss": 0.1959, + "step": 15980 + }, + { + "epoch": 1.56, + "learning_rate": 2.9188762800996402e-05, + "loss": 0.14, + "step": 15985 + }, + { + "epoch": 1.56, + "learning_rate": 2.9184611126487683e-05, + "loss": 0.1528, + "step": 15990 + }, + { + "epoch": 1.56, + "learning_rate": 2.9180459451978967e-05, + "loss": 0.1617, + "step": 15995 + }, + { + "epoch": 1.56, + "learning_rate": 2.9176307777470248e-05, + "loss": 0.1543, + "step": 16000 + }, + { + "epoch": 1.56, + "eval_cer": 0.06663105734257325, + "eval_loss": 0.2845642864704132, + "eval_runtime": 273.4434, + "eval_samples_per_second": 59.866, + "eval_steps_per_second": 1.664, + "eval_wer": 0.17281886863911508, + "step": 16000 + }, + { + "epoch": 1.57, + "learning_rate": 2.9172156102961528e-05, + "loss": 0.1233, + "step": 16005 + }, + { + "epoch": 1.57, + "learning_rate": 2.916800442845281e-05, + "loss": 0.1463, + "step": 16010 + }, + { + "epoch": 1.57, + "learning_rate": 2.916385275394409e-05, + "loss": 0.1605, + "step": 16015 + }, + { + "epoch": 1.57, + "learning_rate": 2.9159701079435374e-05, + "loss": 0.1398, + "step": 16020 + }, + { + "epoch": 1.57, + "learning_rate": 2.9155549404926655e-05, + "loss": 0.1514, + "step": 16025 + }, + { + "epoch": 1.57, + "learning_rate": 2.9151397730417936e-05, + "loss": 0.1693, + "step": 16030 + }, + { + "epoch": 1.57, + "learning_rate": 2.914724605590922e-05, + "loss": 0.1492, + "step": 16035 + }, + { + "epoch": 1.57, + "learning_rate": 2.91430943814005e-05, + "loss": 0.1492, + "step": 16040 + }, + { + "epoch": 1.57, + "learning_rate": 2.913894270689178e-05, + "loss": 0.1731, + "step": 16045 + }, + { + "epoch": 1.57, + "learning_rate": 2.9134791032383062e-05, + "loss": 0.1417, + "step": 16050 + }, + { + "epoch": 1.57, + "learning_rate": 2.9130639357874343e-05, + "loss": 0.1531, + "step": 16055 + }, + { + "epoch": 1.57, + "learning_rate": 2.9126487683365624e-05, + "loss": 0.1551, + "step": 16060 + }, + { + "epoch": 1.57, + "learning_rate": 2.9122336008856904e-05, + "loss": 0.1515, + "step": 16065 + }, + { + "epoch": 1.57, + "learning_rate": 2.911818433434819e-05, + "loss": 0.1209, + "step": 16070 + }, + { + "epoch": 1.57, + "learning_rate": 2.911403265983947e-05, + "loss": 0.1442, + "step": 16075 + }, + { + "epoch": 1.57, + "learning_rate": 2.9109880985330753e-05, + "loss": 0.1783, + "step": 16080 + }, + { + "epoch": 1.57, + "learning_rate": 2.9105729310822034e-05, + "loss": 0.1299, + "step": 16085 + }, + { + "epoch": 1.57, + "learning_rate": 2.9101577636313315e-05, + "loss": 0.1501, + "step": 16090 + }, + { + "epoch": 1.57, + "learning_rate": 2.9097425961804596e-05, + "loss": 0.1834, + "step": 16095 + }, + { + "epoch": 1.57, + "learning_rate": 2.9093274287295876e-05, + "loss": 0.15, + "step": 16100 + }, + { + "epoch": 1.57, + "learning_rate": 2.9089122612787157e-05, + "loss": 0.1465, + "step": 16105 + }, + { + "epoch": 1.58, + "learning_rate": 2.9084970938278438e-05, + "loss": 0.1836, + "step": 16110 + }, + { + "epoch": 1.58, + "learning_rate": 2.908081926376972e-05, + "loss": 0.1701, + "step": 16115 + }, + { + "epoch": 1.58, + "learning_rate": 2.9076667589261003e-05, + "loss": 0.1409, + "step": 16120 + }, + { + "epoch": 1.58, + "learning_rate": 2.9072515914752287e-05, + "loss": 0.1282, + "step": 16125 + }, + { + "epoch": 1.58, + "learning_rate": 2.9068364240243568e-05, + "loss": 0.1661, + "step": 16130 + }, + { + "epoch": 1.58, + "learning_rate": 2.906421256573485e-05, + "loss": 0.1398, + "step": 16135 + }, + { + "epoch": 1.58, + "learning_rate": 2.906006089122613e-05, + "loss": 0.1585, + "step": 16140 + }, + { + "epoch": 1.58, + "learning_rate": 2.905590921671741e-05, + "loss": 0.1686, + "step": 16145 + }, + { + "epoch": 1.58, + "learning_rate": 2.905175754220869e-05, + "loss": 0.1489, + "step": 16150 + }, + { + "epoch": 1.58, + "learning_rate": 2.904760586769997e-05, + "loss": 0.1229, + "step": 16155 + }, + { + "epoch": 1.58, + "learning_rate": 2.9043454193191252e-05, + "loss": 0.1454, + "step": 16160 + }, + { + "epoch": 1.58, + "learning_rate": 2.9039302518682533e-05, + "loss": 0.1747, + "step": 16165 + }, + { + "epoch": 1.58, + "learning_rate": 2.9035150844173817e-05, + "loss": 0.144, + "step": 16170 + }, + { + "epoch": 1.58, + "learning_rate": 2.90309991696651e-05, + "loss": 0.1574, + "step": 16175 + }, + { + "epoch": 1.58, + "learning_rate": 2.9026847495156382e-05, + "loss": 0.1641, + "step": 16180 + }, + { + "epoch": 1.58, + "learning_rate": 2.9022695820647663e-05, + "loss": 0.1443, + "step": 16185 + }, + { + "epoch": 1.58, + "learning_rate": 2.9018544146138944e-05, + "loss": 0.1341, + "step": 16190 + }, + { + "epoch": 1.58, + "learning_rate": 2.9014392471630225e-05, + "loss": 0.1788, + "step": 16195 + }, + { + "epoch": 1.58, + "learning_rate": 2.9010240797121505e-05, + "loss": 0.1448, + "step": 16200 + }, + { + "epoch": 1.58, + "learning_rate": 2.9006089122612786e-05, + "loss": 0.1426, + "step": 16205 + }, + { + "epoch": 1.59, + "learning_rate": 2.9001937448104067e-05, + "loss": 0.1592, + "step": 16210 + }, + { + "epoch": 1.59, + "learning_rate": 2.899778577359535e-05, + "loss": 0.1666, + "step": 16215 + }, + { + "epoch": 1.59, + "learning_rate": 2.8993634099086632e-05, + "loss": 0.1331, + "step": 16220 + }, + { + "epoch": 1.59, + "learning_rate": 2.8989482424577916e-05, + "loss": 0.1382, + "step": 16225 + }, + { + "epoch": 1.59, + "learning_rate": 2.8985330750069197e-05, + "loss": 0.1688, + "step": 16230 + }, + { + "epoch": 1.59, + "learning_rate": 2.8981179075560478e-05, + "loss": 0.1442, + "step": 16235 + }, + { + "epoch": 1.59, + "learning_rate": 2.8977027401051758e-05, + "loss": 0.1419, + "step": 16240 + }, + { + "epoch": 1.59, + "learning_rate": 2.897287572654304e-05, + "loss": 0.1873, + "step": 16245 + }, + { + "epoch": 1.59, + "learning_rate": 2.896872405203432e-05, + "loss": 0.1655, + "step": 16250 + }, + { + "epoch": 1.59, + "learning_rate": 2.8964572377525604e-05, + "loss": 0.1474, + "step": 16255 + }, + { + "epoch": 1.59, + "learning_rate": 2.8960420703016885e-05, + "loss": 0.1684, + "step": 16260 + }, + { + "epoch": 1.59, + "learning_rate": 2.8956269028508166e-05, + "loss": 0.1637, + "step": 16265 + }, + { + "epoch": 1.59, + "learning_rate": 2.8952117353999446e-05, + "loss": 0.1348, + "step": 16270 + }, + { + "epoch": 1.59, + "learning_rate": 2.894796567949073e-05, + "loss": 0.1425, + "step": 16275 + }, + { + "epoch": 1.59, + "learning_rate": 2.894381400498201e-05, + "loss": 0.1788, + "step": 16280 + }, + { + "epoch": 1.59, + "learning_rate": 2.8939662330473292e-05, + "loss": 0.1332, + "step": 16285 + }, + { + "epoch": 1.59, + "learning_rate": 2.8935510655964573e-05, + "loss": 0.1431, + "step": 16290 + }, + { + "epoch": 1.59, + "learning_rate": 2.8931358981455854e-05, + "loss": 0.1875, + "step": 16295 + }, + { + "epoch": 1.59, + "learning_rate": 2.8927207306947138e-05, + "loss": 0.1399, + "step": 16300 + }, + { + "epoch": 1.59, + "learning_rate": 2.892305563243842e-05, + "loss": 0.1335, + "step": 16305 + }, + { + "epoch": 1.59, + "learning_rate": 2.89189039579297e-05, + "loss": 0.1598, + "step": 16310 + }, + { + "epoch": 1.6, + "learning_rate": 2.891475228342098e-05, + "loss": 0.1439, + "step": 16315 + }, + { + "epoch": 1.6, + "learning_rate": 2.891060060891226e-05, + "loss": 0.1311, + "step": 16320 + }, + { + "epoch": 1.6, + "learning_rate": 2.890644893440354e-05, + "loss": 0.1383, + "step": 16325 + }, + { + "epoch": 1.6, + "learning_rate": 2.8902297259894826e-05, + "loss": 0.1567, + "step": 16330 + }, + { + "epoch": 1.6, + "learning_rate": 2.8898145585386106e-05, + "loss": 0.1443, + "step": 16335 + }, + { + "epoch": 1.6, + "learning_rate": 2.8893993910877387e-05, + "loss": 0.1492, + "step": 16340 + }, + { + "epoch": 1.6, + "learning_rate": 2.888984223636867e-05, + "loss": 0.174, + "step": 16345 + }, + { + "epoch": 1.6, + "learning_rate": 2.8885690561859952e-05, + "loss": 0.139, + "step": 16350 + }, + { + "epoch": 1.6, + "learning_rate": 2.8881538887351233e-05, + "loss": 0.142, + "step": 16355 + }, + { + "epoch": 1.6, + "learning_rate": 2.8877387212842514e-05, + "loss": 0.1729, + "step": 16360 + }, + { + "epoch": 1.6, + "learning_rate": 2.8873235538333794e-05, + "loss": 0.1682, + "step": 16365 + }, + { + "epoch": 1.6, + "learning_rate": 2.8869083863825075e-05, + "loss": 0.1383, + "step": 16370 + }, + { + "epoch": 1.6, + "learning_rate": 2.8865762524218103e-05, + "loss": 0.1504, + "step": 16375 + }, + { + "epoch": 1.6, + "learning_rate": 2.8861610849709384e-05, + "loss": 0.1789, + "step": 16380 + }, + { + "epoch": 1.6, + "learning_rate": 2.8857459175200665e-05, + "loss": 0.1407, + "step": 16385 + }, + { + "epoch": 1.6, + "learning_rate": 2.8853307500691945e-05, + "loss": 0.1332, + "step": 16390 + }, + { + "epoch": 1.6, + "learning_rate": 2.8849155826183226e-05, + "loss": 0.1602, + "step": 16395 + }, + { + "epoch": 1.6, + "learning_rate": 2.884500415167451e-05, + "loss": 0.1569, + "step": 16400 + }, + { + "epoch": 1.6, + "learning_rate": 2.884085247716579e-05, + "loss": 0.1351, + "step": 16405 + }, + { + "epoch": 1.6, + "learning_rate": 2.8836700802657072e-05, + "loss": 0.1492, + "step": 16410 + }, + { + "epoch": 1.61, + "learning_rate": 2.8832549128148356e-05, + "loss": 0.1367, + "step": 16415 + }, + { + "epoch": 1.61, + "learning_rate": 2.8828397453639637e-05, + "loss": 0.1495, + "step": 16420 + }, + { + "epoch": 1.61, + "learning_rate": 2.8824245779130918e-05, + "loss": 0.1403, + "step": 16425 + }, + { + "epoch": 1.61, + "learning_rate": 2.88200941046222e-05, + "loss": 0.1781, + "step": 16430 + }, + { + "epoch": 1.61, + "learning_rate": 2.881594243011348e-05, + "loss": 0.1197, + "step": 16435 + }, + { + "epoch": 1.61, + "learning_rate": 2.881179075560476e-05, + "loss": 0.1475, + "step": 16440 + }, + { + "epoch": 1.61, + "learning_rate": 2.880763908109604e-05, + "loss": 0.1594, + "step": 16445 + }, + { + "epoch": 1.61, + "learning_rate": 2.8803487406587325e-05, + "loss": 0.1455, + "step": 16450 + }, + { + "epoch": 1.61, + "learning_rate": 2.8799335732078606e-05, + "loss": 0.1582, + "step": 16455 + }, + { + "epoch": 1.61, + "learning_rate": 2.879518405756989e-05, + "loss": 0.1882, + "step": 16460 + }, + { + "epoch": 1.61, + "learning_rate": 2.879103238306117e-05, + "loss": 0.1692, + "step": 16465 + }, + { + "epoch": 1.61, + "learning_rate": 2.878688070855245e-05, + "loss": 0.1389, + "step": 16470 + }, + { + "epoch": 1.61, + "learning_rate": 2.8782729034043732e-05, + "loss": 0.169, + "step": 16475 + }, + { + "epoch": 1.61, + "learning_rate": 2.8778577359535013e-05, + "loss": 0.1674, + "step": 16480 + }, + { + "epoch": 1.61, + "learning_rate": 2.8774425685026294e-05, + "loss": 0.1476, + "step": 16485 + }, + { + "epoch": 1.61, + "learning_rate": 2.8770274010517574e-05, + "loss": 0.1465, + "step": 16490 + }, + { + "epoch": 1.61, + "learning_rate": 2.8766122336008855e-05, + "loss": 0.1705, + "step": 16495 + }, + { + "epoch": 1.61, + "learning_rate": 2.876197066150014e-05, + "loss": 0.1354, + "step": 16500 + }, + { + "epoch": 1.61, + "eval_cer": 0.06573157506514887, + "eval_loss": 0.2781069874763489, + "eval_runtime": 272.2382, + "eval_samples_per_second": 60.131, + "eval_steps_per_second": 1.671, + "eval_wer": 0.1695931253795472, + "step": 16500 + }, + { + "epoch": 1.61, + "learning_rate": 2.8757818986991424e-05, + "loss": 0.1401, + "step": 16505 + }, + { + "epoch": 1.61, + "learning_rate": 2.8753667312482704e-05, + "loss": 0.1604, + "step": 16510 + }, + { + "epoch": 1.61, + "learning_rate": 2.8749515637973985e-05, + "loss": 0.1708, + "step": 16515 + }, + { + "epoch": 1.62, + "learning_rate": 2.8745363963465266e-05, + "loss": 0.1327, + "step": 16520 + }, + { + "epoch": 1.62, + "learning_rate": 2.8741212288956547e-05, + "loss": 0.1321, + "step": 16525 + }, + { + "epoch": 1.62, + "learning_rate": 2.8737060614447827e-05, + "loss": 0.1635, + "step": 16530 + }, + { + "epoch": 1.62, + "learning_rate": 2.8732908939939108e-05, + "loss": 0.1444, + "step": 16535 + }, + { + "epoch": 1.62, + "learning_rate": 2.872875726543039e-05, + "loss": 0.1402, + "step": 16540 + }, + { + "epoch": 1.62, + "learning_rate": 2.872460559092167e-05, + "loss": 0.1679, + "step": 16545 + }, + { + "epoch": 1.62, + "learning_rate": 2.8720453916412954e-05, + "loss": 0.146, + "step": 16550 + }, + { + "epoch": 1.62, + "learning_rate": 2.8716302241904238e-05, + "loss": 0.1427, + "step": 16555 + }, + { + "epoch": 1.62, + "learning_rate": 2.871215056739552e-05, + "loss": 0.1538, + "step": 16560 + }, + { + "epoch": 1.62, + "learning_rate": 2.87079988928868e-05, + "loss": 0.1558, + "step": 16565 + }, + { + "epoch": 1.62, + "learning_rate": 2.870384721837808e-05, + "loss": 0.1512, + "step": 16570 + }, + { + "epoch": 1.62, + "learning_rate": 2.869969554386936e-05, + "loss": 0.1441, + "step": 16575 + }, + { + "epoch": 1.62, + "learning_rate": 2.8695543869360642e-05, + "loss": 0.1554, + "step": 16580 + }, + { + "epoch": 1.62, + "learning_rate": 2.8691392194851923e-05, + "loss": 0.135, + "step": 16585 + }, + { + "epoch": 1.62, + "learning_rate": 2.8687240520343203e-05, + "loss": 0.1372, + "step": 16590 + }, + { + "epoch": 1.62, + "learning_rate": 2.8683088845834487e-05, + "loss": 0.1729, + "step": 16595 + }, + { + "epoch": 1.62, + "learning_rate": 2.8678937171325768e-05, + "loss": 0.167, + "step": 16600 + }, + { + "epoch": 1.62, + "learning_rate": 2.8674785496817052e-05, + "loss": 0.1626, + "step": 16605 + }, + { + "epoch": 1.62, + "learning_rate": 2.8670633822308333e-05, + "loss": 0.1518, + "step": 16610 + }, + { + "epoch": 1.62, + "learning_rate": 2.8666482147799614e-05, + "loss": 0.1566, + "step": 16615 + }, + { + "epoch": 1.63, + "learning_rate": 2.8662330473290895e-05, + "loss": 0.1519, + "step": 16620 + }, + { + "epoch": 1.63, + "learning_rate": 2.8658178798782175e-05, + "loss": 0.1448, + "step": 16625 + }, + { + "epoch": 1.63, + "learning_rate": 2.8654027124273456e-05, + "loss": 0.166, + "step": 16630 + }, + { + "epoch": 1.63, + "learning_rate": 2.864987544976474e-05, + "loss": 0.1394, + "step": 16635 + }, + { + "epoch": 1.63, + "learning_rate": 2.864572377525602e-05, + "loss": 0.1536, + "step": 16640 + }, + { + "epoch": 1.63, + "learning_rate": 2.8641572100747302e-05, + "loss": 0.1653, + "step": 16645 + }, + { + "epoch": 1.63, + "learning_rate": 2.8637420426238583e-05, + "loss": 0.1432, + "step": 16650 + }, + { + "epoch": 1.63, + "learning_rate": 2.8633268751729867e-05, + "loss": 0.1507, + "step": 16655 + }, + { + "epoch": 1.63, + "learning_rate": 2.8629117077221148e-05, + "loss": 0.1716, + "step": 16660 + }, + { + "epoch": 1.63, + "learning_rate": 2.862496540271243e-05, + "loss": 0.1456, + "step": 16665 + }, + { + "epoch": 1.63, + "learning_rate": 2.862081372820371e-05, + "loss": 0.144, + "step": 16670 + }, + { + "epoch": 1.63, + "learning_rate": 2.861666205369499e-05, + "loss": 0.1302, + "step": 16675 + }, + { + "epoch": 1.63, + "learning_rate": 2.8612510379186274e-05, + "loss": 0.187, + "step": 16680 + }, + { + "epoch": 1.63, + "learning_rate": 2.8608358704677555e-05, + "loss": 0.1327, + "step": 16685 + }, + { + "epoch": 1.63, + "learning_rate": 2.8604207030168836e-05, + "loss": 0.1505, + "step": 16690 + }, + { + "epoch": 1.63, + "learning_rate": 2.8600055355660116e-05, + "loss": 0.1661, + "step": 16695 + }, + { + "epoch": 1.63, + "learning_rate": 2.8595903681151397e-05, + "loss": 0.1537, + "step": 16700 + }, + { + "epoch": 1.63, + "learning_rate": 2.8591752006642678e-05, + "loss": 0.1442, + "step": 16705 + }, + { + "epoch": 1.63, + "learning_rate": 2.8587600332133962e-05, + "loss": 0.1663, + "step": 16710 + }, + { + "epoch": 1.63, + "learning_rate": 2.8583448657625243e-05, + "loss": 0.1623, + "step": 16715 + }, + { + "epoch": 1.63, + "learning_rate": 2.8579296983116524e-05, + "loss": 0.1356, + "step": 16720 + }, + { + "epoch": 1.64, + "learning_rate": 2.8575145308607808e-05, + "loss": 0.1507, + "step": 16725 + }, + { + "epoch": 1.64, + "learning_rate": 2.857099363409909e-05, + "loss": 0.1887, + "step": 16730 + }, + { + "epoch": 1.64, + "learning_rate": 2.856684195959037e-05, + "loss": 0.1362, + "step": 16735 + }, + { + "epoch": 1.64, + "learning_rate": 2.856269028508165e-05, + "loss": 0.1335, + "step": 16740 + }, + { + "epoch": 1.64, + "learning_rate": 2.855853861057293e-05, + "loss": 0.1735, + "step": 16745 + }, + { + "epoch": 1.64, + "learning_rate": 2.855438693606421e-05, + "loss": 0.1288, + "step": 16750 + }, + { + "epoch": 1.64, + "learning_rate": 2.8550235261555492e-05, + "loss": 0.1182, + "step": 16755 + }, + { + "epoch": 1.64, + "learning_rate": 2.8546083587046777e-05, + "loss": 0.1502, + "step": 16760 + }, + { + "epoch": 1.64, + "learning_rate": 2.8541931912538057e-05, + "loss": 0.1714, + "step": 16765 + }, + { + "epoch": 1.64, + "learning_rate": 2.853778023802934e-05, + "loss": 0.1532, + "step": 16770 + }, + { + "epoch": 1.64, + "learning_rate": 2.8533628563520622e-05, + "loss": 0.1484, + "step": 16775 + }, + { + "epoch": 1.64, + "learning_rate": 2.8529476889011903e-05, + "loss": 0.1678, + "step": 16780 + }, + { + "epoch": 1.64, + "learning_rate": 2.8525325214503184e-05, + "loss": 0.127, + "step": 16785 + }, + { + "epoch": 1.64, + "learning_rate": 2.8521173539994465e-05, + "loss": 0.1528, + "step": 16790 + }, + { + "epoch": 1.64, + "learning_rate": 2.8517021865485745e-05, + "loss": 0.2006, + "step": 16795 + }, + { + "epoch": 1.64, + "learning_rate": 2.8512870190977026e-05, + "loss": 0.1567, + "step": 16800 + }, + { + "epoch": 1.64, + "learning_rate": 2.8508718516468307e-05, + "loss": 0.1279, + "step": 16805 + }, + { + "epoch": 1.64, + "learning_rate": 2.850456684195959e-05, + "loss": 0.1748, + "step": 16810 + }, + { + "epoch": 1.64, + "learning_rate": 2.8500415167450875e-05, + "loss": 0.1546, + "step": 16815 + }, + { + "epoch": 1.64, + "learning_rate": 2.8496263492942156e-05, + "loss": 0.1444, + "step": 16820 + }, + { + "epoch": 1.65, + "learning_rate": 2.8492111818433437e-05, + "loss": 0.1405, + "step": 16825 + }, + { + "epoch": 1.65, + "learning_rate": 2.8487960143924717e-05, + "loss": 0.1623, + "step": 16830 + }, + { + "epoch": 1.65, + "learning_rate": 2.8483808469415998e-05, + "loss": 0.1414, + "step": 16835 + }, + { + "epoch": 1.65, + "learning_rate": 2.847965679490728e-05, + "loss": 0.141, + "step": 16840 + }, + { + "epoch": 1.65, + "learning_rate": 2.847550512039856e-05, + "loss": 0.1646, + "step": 16845 + }, + { + "epoch": 1.65, + "learning_rate": 2.847135344588984e-05, + "loss": 0.1545, + "step": 16850 + }, + { + "epoch": 1.65, + "learning_rate": 2.846720177138112e-05, + "loss": 0.1184, + "step": 16855 + }, + { + "epoch": 1.65, + "learning_rate": 2.846305009687241e-05, + "loss": 0.1664, + "step": 16860 + }, + { + "epoch": 1.65, + "learning_rate": 2.845889842236369e-05, + "loss": 0.1443, + "step": 16865 + }, + { + "epoch": 1.65, + "learning_rate": 2.845474674785497e-05, + "loss": 0.111, + "step": 16870 + }, + { + "epoch": 1.65, + "learning_rate": 2.845059507334625e-05, + "loss": 0.1405, + "step": 16875 + }, + { + "epoch": 1.65, + "learning_rate": 2.8446443398837532e-05, + "loss": 0.1711, + "step": 16880 + }, + { + "epoch": 1.65, + "learning_rate": 2.8442291724328813e-05, + "loss": 0.1346, + "step": 16885 + }, + { + "epoch": 1.65, + "learning_rate": 2.8438140049820093e-05, + "loss": 0.1471, + "step": 16890 + }, + { + "epoch": 1.65, + "learning_rate": 2.8433988375311374e-05, + "loss": 0.1842, + "step": 16895 + }, + { + "epoch": 1.65, + "learning_rate": 2.842983670080266e-05, + "loss": 0.1416, + "step": 16900 + }, + { + "epoch": 1.65, + "learning_rate": 2.842568502629394e-05, + "loss": 0.1425, + "step": 16905 + }, + { + "epoch": 1.65, + "learning_rate": 2.842153335178522e-05, + "loss": 0.166, + "step": 16910 + }, + { + "epoch": 1.65, + "learning_rate": 2.8417381677276504e-05, + "loss": 0.1651, + "step": 16915 + }, + { + "epoch": 1.65, + "learning_rate": 2.8413230002767785e-05, + "loss": 0.1326, + "step": 16920 + }, + { + "epoch": 1.65, + "learning_rate": 2.8409078328259066e-05, + "loss": 0.1295, + "step": 16925 + }, + { + "epoch": 1.66, + "learning_rate": 2.8404926653750346e-05, + "loss": 0.172, + "step": 16930 + }, + { + "epoch": 1.66, + "learning_rate": 2.8400774979241627e-05, + "loss": 0.1313, + "step": 16935 + }, + { + "epoch": 1.66, + "learning_rate": 2.8396623304732908e-05, + "loss": 0.1572, + "step": 16940 + }, + { + "epoch": 1.66, + "learning_rate": 2.8392471630224192e-05, + "loss": 0.1696, + "step": 16945 + }, + { + "epoch": 1.66, + "learning_rate": 2.8388319955715473e-05, + "loss": 0.1577, + "step": 16950 + }, + { + "epoch": 1.66, + "learning_rate": 2.8384168281206754e-05, + "loss": 0.1443, + "step": 16955 + }, + { + "epoch": 1.66, + "learning_rate": 2.8380016606698034e-05, + "loss": 0.1583, + "step": 16960 + }, + { + "epoch": 1.66, + "learning_rate": 2.837586493218932e-05, + "loss": 0.1591, + "step": 16965 + }, + { + "epoch": 1.66, + "learning_rate": 2.83717132576806e-05, + "loss": 0.1444, + "step": 16970 + }, + { + "epoch": 1.66, + "learning_rate": 2.836756158317188e-05, + "loss": 0.1568, + "step": 16975 + }, + { + "epoch": 1.66, + "learning_rate": 2.836340990866316e-05, + "loss": 0.1634, + "step": 16980 + }, + { + "epoch": 1.66, + "learning_rate": 2.835925823415444e-05, + "loss": 0.1387, + "step": 16985 + }, + { + "epoch": 1.66, + "learning_rate": 2.8355106559645726e-05, + "loss": 0.1407, + "step": 16990 + }, + { + "epoch": 1.66, + "learning_rate": 2.8350954885137007e-05, + "loss": 0.1542, + "step": 16995 + }, + { + "epoch": 1.66, + "learning_rate": 2.8346803210628287e-05, + "loss": 0.1246, + "step": 17000 + }, + { + "epoch": 1.66, + "eval_cer": 0.06744151630976412, + "eval_loss": 0.2941415309906006, + "eval_runtime": 331.6426, + "eval_samples_per_second": 49.36, + "eval_steps_per_second": 1.372, + "eval_wer": 0.17289069693032003, + "step": 17000 + }, + { + "epoch": 1.66, + "learning_rate": 2.8342651536119568e-05, + "loss": 0.129, + "step": 17005 + }, + { + "epoch": 1.66, + "learning_rate": 2.833849986161085e-05, + "loss": 0.1538, + "step": 17010 + }, + { + "epoch": 1.66, + "learning_rate": 2.8334348187102133e-05, + "loss": 0.1628, + "step": 17015 + }, + { + "epoch": 1.66, + "learning_rate": 2.8330196512593414e-05, + "loss": 0.1375, + "step": 17020 + }, + { + "epoch": 1.66, + "learning_rate": 2.8326044838084695e-05, + "loss": 0.1414, + "step": 17025 + }, + { + "epoch": 1.67, + "learning_rate": 2.8321893163575975e-05, + "loss": 0.1603, + "step": 17030 + }, + { + "epoch": 1.67, + "learning_rate": 2.831774148906726e-05, + "loss": 0.146, + "step": 17035 + }, + { + "epoch": 1.67, + "learning_rate": 2.831358981455854e-05, + "loss": 0.1297, + "step": 17040 + }, + { + "epoch": 1.67, + "learning_rate": 2.830943814004982e-05, + "loss": 0.1685, + "step": 17045 + }, + { + "epoch": 1.67, + "learning_rate": 2.8305286465541102e-05, + "loss": 0.1452, + "step": 17050 + }, + { + "epoch": 1.67, + "learning_rate": 2.8301134791032383e-05, + "loss": 0.1344, + "step": 17055 + }, + { + "epoch": 1.67, + "learning_rate": 2.8296983116523663e-05, + "loss": 0.1552, + "step": 17060 + }, + { + "epoch": 1.67, + "learning_rate": 2.8292831442014947e-05, + "loss": 0.1468, + "step": 17065 + }, + { + "epoch": 1.67, + "learning_rate": 2.8288679767506228e-05, + "loss": 0.1211, + "step": 17070 + }, + { + "epoch": 1.67, + "learning_rate": 2.828452809299751e-05, + "loss": 0.1291, + "step": 17075 + }, + { + "epoch": 1.67, + "learning_rate": 2.8280376418488793e-05, + "loss": 0.1848, + "step": 17080 + }, + { + "epoch": 1.67, + "learning_rate": 2.8276224743980074e-05, + "loss": 0.142, + "step": 17085 + }, + { + "epoch": 1.67, + "learning_rate": 2.8272073069471355e-05, + "loss": 0.1352, + "step": 17090 + }, + { + "epoch": 1.67, + "learning_rate": 2.8267921394962635e-05, + "loss": 0.1812, + "step": 17095 + }, + { + "epoch": 1.67, + "learning_rate": 2.8263769720453916e-05, + "loss": 0.1354, + "step": 17100 + }, + { + "epoch": 1.67, + "learning_rate": 2.8259618045945197e-05, + "loss": 0.135, + "step": 17105 + }, + { + "epoch": 1.67, + "learning_rate": 2.8255466371436478e-05, + "loss": 0.1545, + "step": 17110 + }, + { + "epoch": 1.67, + "learning_rate": 2.8251314696927762e-05, + "loss": 0.1585, + "step": 17115 + }, + { + "epoch": 1.67, + "learning_rate": 2.8247163022419046e-05, + "loss": 0.1314, + "step": 17120 + }, + { + "epoch": 1.67, + "learning_rate": 2.8243011347910327e-05, + "loss": 0.1443, + "step": 17125 + }, + { + "epoch": 1.68, + "learning_rate": 2.8238859673401608e-05, + "loss": 0.189, + "step": 17130 + }, + { + "epoch": 1.68, + "learning_rate": 2.823470799889289e-05, + "loss": 0.1241, + "step": 17135 + }, + { + "epoch": 1.68, + "learning_rate": 2.823055632438417e-05, + "loss": 0.1259, + "step": 17140 + }, + { + "epoch": 1.68, + "learning_rate": 2.822640464987545e-05, + "loss": 0.1705, + "step": 17145 + }, + { + "epoch": 1.68, + "learning_rate": 2.822225297536673e-05, + "loss": 0.1592, + "step": 17150 + }, + { + "epoch": 1.68, + "learning_rate": 2.821810130085801e-05, + "loss": 0.1298, + "step": 17155 + }, + { + "epoch": 1.68, + "learning_rate": 2.8213949626349292e-05, + "loss": 0.151, + "step": 17160 + }, + { + "epoch": 1.68, + "learning_rate": 2.8209797951840576e-05, + "loss": 0.1576, + "step": 17165 + }, + { + "epoch": 1.68, + "learning_rate": 2.820564627733186e-05, + "loss": 0.1374, + "step": 17170 + }, + { + "epoch": 1.68, + "learning_rate": 2.820149460282314e-05, + "loss": 0.1568, + "step": 17175 + }, + { + "epoch": 1.68, + "learning_rate": 2.8197342928314422e-05, + "loss": 0.1865, + "step": 17180 + }, + { + "epoch": 1.68, + "learning_rate": 2.8193191253805703e-05, + "loss": 0.1418, + "step": 17185 + }, + { + "epoch": 1.68, + "learning_rate": 2.8189039579296984e-05, + "loss": 0.1319, + "step": 17190 + }, + { + "epoch": 1.68, + "learning_rate": 2.8184887904788264e-05, + "loss": 0.1606, + "step": 17195 + }, + { + "epoch": 1.68, + "learning_rate": 2.8180736230279545e-05, + "loss": 0.1314, + "step": 17200 + }, + { + "epoch": 1.68, + "learning_rate": 2.8176584555770826e-05, + "loss": 0.1512, + "step": 17205 + }, + { + "epoch": 1.68, + "learning_rate": 2.817243288126211e-05, + "loss": 0.1556, + "step": 17210 + }, + { + "epoch": 1.68, + "learning_rate": 2.816828120675339e-05, + "loss": 0.1574, + "step": 17215 + }, + { + "epoch": 1.68, + "learning_rate": 2.8164129532244675e-05, + "loss": 0.1411, + "step": 17220 + }, + { + "epoch": 1.68, + "learning_rate": 2.8159977857735956e-05, + "loss": 0.154, + "step": 17225 + }, + { + "epoch": 1.68, + "learning_rate": 2.8155826183227237e-05, + "loss": 0.187, + "step": 17230 + }, + { + "epoch": 1.69, + "learning_rate": 2.8151674508718517e-05, + "loss": 0.1451, + "step": 17235 + }, + { + "epoch": 1.69, + "learning_rate": 2.8147522834209798e-05, + "loss": 0.1406, + "step": 17240 + }, + { + "epoch": 1.69, + "learning_rate": 2.814337115970108e-05, + "loss": 0.177, + "step": 17245 + }, + { + "epoch": 1.69, + "learning_rate": 2.813921948519236e-05, + "loss": 0.143, + "step": 17250 + }, + { + "epoch": 1.69, + "learning_rate": 2.8135067810683644e-05, + "loss": 0.1315, + "step": 17255 + }, + { + "epoch": 1.69, + "learning_rate": 2.8130916136174925e-05, + "loss": 0.1643, + "step": 17260 + }, + { + "epoch": 1.69, + "learning_rate": 2.8126764461666205e-05, + "loss": 0.1504, + "step": 17265 + }, + { + "epoch": 1.69, + "learning_rate": 2.812261278715749e-05, + "loss": 0.1457, + "step": 17270 + }, + { + "epoch": 1.69, + "learning_rate": 2.811846111264877e-05, + "loss": 0.1539, + "step": 17275 + }, + { + "epoch": 1.69, + "learning_rate": 2.811430943814005e-05, + "loss": 0.1876, + "step": 17280 + }, + { + "epoch": 1.69, + "learning_rate": 2.8110157763631332e-05, + "loss": 0.141, + "step": 17285 + }, + { + "epoch": 1.69, + "learning_rate": 2.8106006089122613e-05, + "loss": 0.1548, + "step": 17290 + }, + { + "epoch": 1.69, + "learning_rate": 2.8101854414613893e-05, + "loss": 0.174, + "step": 17295 + }, + { + "epoch": 1.69, + "learning_rate": 2.8097702740105177e-05, + "loss": 0.1394, + "step": 17300 + }, + { + "epoch": 1.69, + "learning_rate": 2.8093551065596458e-05, + "loss": 0.1335, + "step": 17305 + }, + { + "epoch": 1.69, + "learning_rate": 2.808939939108774e-05, + "loss": 0.1443, + "step": 17310 + }, + { + "epoch": 1.69, + "learning_rate": 2.808524771657902e-05, + "loss": 0.1711, + "step": 17315 + }, + { + "epoch": 1.69, + "learning_rate": 2.80810960420703e-05, + "loss": 0.1483, + "step": 17320 + }, + { + "epoch": 1.69, + "learning_rate": 2.8076944367561585e-05, + "loss": 0.1402, + "step": 17325 + }, + { + "epoch": 1.69, + "learning_rate": 2.8072792693052865e-05, + "loss": 0.1646, + "step": 17330 + }, + { + "epoch": 1.7, + "learning_rate": 2.8068641018544146e-05, + "loss": 0.1298, + "step": 17335 + }, + { + "epoch": 1.7, + "learning_rate": 2.806448934403543e-05, + "loss": 0.1202, + "step": 17340 + }, + { + "epoch": 1.7, + "learning_rate": 2.806033766952671e-05, + "loss": 0.1652, + "step": 17345 + }, + { + "epoch": 1.7, + "learning_rate": 2.8056185995017992e-05, + "loss": 0.1461, + "step": 17350 + }, + { + "epoch": 1.7, + "learning_rate": 2.8052034320509273e-05, + "loss": 0.1375, + "step": 17355 + }, + { + "epoch": 1.7, + "learning_rate": 2.8047882646000553e-05, + "loss": 0.1374, + "step": 17360 + }, + { + "epoch": 1.7, + "learning_rate": 2.8043730971491834e-05, + "loss": 0.1636, + "step": 17365 + }, + { + "epoch": 1.7, + "learning_rate": 2.8039579296983115e-05, + "loss": 0.1255, + "step": 17370 + }, + { + "epoch": 1.7, + "learning_rate": 2.80354276224744e-05, + "loss": 0.1479, + "step": 17375 + }, + { + "epoch": 1.7, + "learning_rate": 2.803127594796568e-05, + "loss": 0.1645, + "step": 17380 + }, + { + "epoch": 1.7, + "learning_rate": 2.8027124273456964e-05, + "loss": 0.1431, + "step": 17385 + }, + { + "epoch": 1.7, + "learning_rate": 2.8022972598948245e-05, + "loss": 0.1294, + "step": 17390 + }, + { + "epoch": 1.7, + "learning_rate": 2.8018820924439526e-05, + "loss": 0.1796, + "step": 17395 + }, + { + "epoch": 1.7, + "learning_rate": 2.8014669249930806e-05, + "loss": 0.1531, + "step": 17400 + }, + { + "epoch": 1.7, + "learning_rate": 2.8010517575422087e-05, + "loss": 0.1386, + "step": 17405 + }, + { + "epoch": 1.7, + "learning_rate": 2.8006365900913368e-05, + "loss": 0.1555, + "step": 17410 + }, + { + "epoch": 1.7, + "learning_rate": 2.800221422640465e-05, + "loss": 0.1579, + "step": 17415 + }, + { + "epoch": 1.7, + "learning_rate": 2.799806255189593e-05, + "loss": 0.1279, + "step": 17420 + }, + { + "epoch": 1.7, + "learning_rate": 2.7993910877387214e-05, + "loss": 0.1355, + "step": 17425 + }, + { + "epoch": 1.7, + "learning_rate": 2.7989759202878498e-05, + "loss": 0.1749, + "step": 17430 + }, + { + "epoch": 1.7, + "learning_rate": 2.798560752836978e-05, + "loss": 0.1338, + "step": 17435 + }, + { + "epoch": 1.71, + "learning_rate": 2.798145585386106e-05, + "loss": 0.1465, + "step": 17440 + }, + { + "epoch": 1.71, + "learning_rate": 2.797730417935234e-05, + "loss": 0.175, + "step": 17445 + }, + { + "epoch": 1.71, + "learning_rate": 2.797315250484362e-05, + "loss": 0.1374, + "step": 17450 + }, + { + "epoch": 1.71, + "learning_rate": 2.79690008303349e-05, + "loss": 0.1267, + "step": 17455 + }, + { + "epoch": 1.71, + "learning_rate": 2.7964849155826182e-05, + "loss": 0.1477, + "step": 17460 + }, + { + "epoch": 1.71, + "learning_rate": 2.7960697481317463e-05, + "loss": 0.1827, + "step": 17465 + }, + { + "epoch": 1.71, + "learning_rate": 2.7956545806808744e-05, + "loss": 0.1315, + "step": 17470 + }, + { + "epoch": 1.71, + "learning_rate": 2.795239413230003e-05, + "loss": 0.1605, + "step": 17475 + }, + { + "epoch": 1.71, + "learning_rate": 2.7948242457791312e-05, + "loss": 0.1774, + "step": 17480 + }, + { + "epoch": 1.71, + "learning_rate": 2.7944090783282593e-05, + "loss": 0.1319, + "step": 17485 + }, + { + "epoch": 1.71, + "learning_rate": 2.7939939108773874e-05, + "loss": 0.1294, + "step": 17490 + }, + { + "epoch": 1.71, + "learning_rate": 2.7935787434265155e-05, + "loss": 0.1648, + "step": 17495 + }, + { + "epoch": 1.71, + "learning_rate": 2.7931635759756435e-05, + "loss": 0.1538, + "step": 17500 + }, + { + "epoch": 1.71, + "eval_cer": 0.06619634611338102, + "eval_loss": 0.28032588958740234, + "eval_runtime": 273.8869, + "eval_samples_per_second": 59.769, + "eval_steps_per_second": 1.661, + "eval_wer": 0.17073584819417145, + "step": 17500 + }, + { + "epoch": 1.71, + "learning_rate": 2.7927484085247716e-05, + "loss": 0.134, + "step": 17505 + }, + { + "epoch": 1.71, + "learning_rate": 2.7923332410738997e-05, + "loss": 0.1464, + "step": 17510 + }, + { + "epoch": 1.71, + "learning_rate": 2.7919180736230278e-05, + "loss": 0.165, + "step": 17515 + }, + { + "epoch": 1.71, + "learning_rate": 2.7915029061721562e-05, + "loss": 0.1527, + "step": 17520 + }, + { + "epoch": 1.71, + "learning_rate": 2.7910877387212843e-05, + "loss": 0.151, + "step": 17525 + }, + { + "epoch": 1.71, + "learning_rate": 2.7906725712704127e-05, + "loss": 0.1948, + "step": 17530 + }, + { + "epoch": 1.71, + "learning_rate": 2.7902574038195407e-05, + "loss": 0.1551, + "step": 17535 + }, + { + "epoch": 1.72, + "learning_rate": 2.7898422363686688e-05, + "loss": 0.1429, + "step": 17540 + }, + { + "epoch": 1.72, + "learning_rate": 2.789427068917797e-05, + "loss": 0.166, + "step": 17545 + }, + { + "epoch": 1.72, + "learning_rate": 2.789011901466925e-05, + "loss": 0.1483, + "step": 17550 + }, + { + "epoch": 1.72, + "learning_rate": 2.788596734016053e-05, + "loss": 0.1277, + "step": 17555 + }, + { + "epoch": 1.72, + "learning_rate": 2.788181566565181e-05, + "loss": 0.1394, + "step": 17560 + }, + { + "epoch": 1.72, + "learning_rate": 2.7877663991143095e-05, + "loss": 0.1494, + "step": 17565 + }, + { + "epoch": 1.72, + "learning_rate": 2.7873512316634376e-05, + "loss": 0.1499, + "step": 17570 + }, + { + "epoch": 1.72, + "learning_rate": 2.7869360642125657e-05, + "loss": 0.1385, + "step": 17575 + }, + { + "epoch": 1.72, + "learning_rate": 2.786520896761694e-05, + "loss": 0.1476, + "step": 17580 + }, + { + "epoch": 1.72, + "learning_rate": 2.7861057293108222e-05, + "loss": 0.1441, + "step": 17585 + }, + { + "epoch": 1.72, + "learning_rate": 2.7856905618599503e-05, + "loss": 0.1355, + "step": 17590 + }, + { + "epoch": 1.72, + "learning_rate": 2.7852753944090783e-05, + "loss": 0.1601, + "step": 17595 + }, + { + "epoch": 1.72, + "learning_rate": 2.7848602269582064e-05, + "loss": 0.1441, + "step": 17600 + }, + { + "epoch": 1.72, + "learning_rate": 2.784445059507335e-05, + "loss": 0.1209, + "step": 17605 + }, + { + "epoch": 1.72, + "learning_rate": 2.784029892056463e-05, + "loss": 0.1416, + "step": 17610 + }, + { + "epoch": 1.72, + "learning_rate": 2.783614724605591e-05, + "loss": 0.1746, + "step": 17615 + }, + { + "epoch": 1.72, + "learning_rate": 2.783199557154719e-05, + "loss": 0.13, + "step": 17620 + }, + { + "epoch": 1.72, + "learning_rate": 2.782784389703847e-05, + "loss": 0.1278, + "step": 17625 + }, + { + "epoch": 1.72, + "learning_rate": 2.7823692222529756e-05, + "loss": 0.1643, + "step": 17630 + }, + { + "epoch": 1.72, + "learning_rate": 2.7819540548021036e-05, + "loss": 0.1351, + "step": 17635 + }, + { + "epoch": 1.72, + "learning_rate": 2.7815388873512317e-05, + "loss": 0.1401, + "step": 17640 + }, + { + "epoch": 1.73, + "learning_rate": 2.7811237199003598e-05, + "loss": 0.1617, + "step": 17645 + }, + { + "epoch": 1.73, + "learning_rate": 2.7807085524494882e-05, + "loss": 0.1424, + "step": 17650 + }, + { + "epoch": 1.73, + "learning_rate": 2.7802933849986163e-05, + "loss": 0.142, + "step": 17655 + }, + { + "epoch": 1.73, + "learning_rate": 2.7798782175477444e-05, + "loss": 0.1469, + "step": 17660 + }, + { + "epoch": 1.73, + "learning_rate": 2.7794630500968724e-05, + "loss": 0.1474, + "step": 17665 + }, + { + "epoch": 1.73, + "learning_rate": 2.7790478826460005e-05, + "loss": 0.144, + "step": 17670 + }, + { + "epoch": 1.73, + "learning_rate": 2.7786327151951286e-05, + "loss": 0.1322, + "step": 17675 + }, + { + "epoch": 1.73, + "learning_rate": 2.778217547744257e-05, + "loss": 0.1645, + "step": 17680 + }, + { + "epoch": 1.73, + "learning_rate": 2.777802380293385e-05, + "loss": 0.1399, + "step": 17685 + }, + { + "epoch": 1.73, + "learning_rate": 2.777387212842513e-05, + "loss": 0.1474, + "step": 17690 + }, + { + "epoch": 1.73, + "learning_rate": 2.7769720453916416e-05, + "loss": 0.1617, + "step": 17695 + }, + { + "epoch": 1.73, + "learning_rate": 2.7765568779407697e-05, + "loss": 0.1503, + "step": 17700 + }, + { + "epoch": 1.73, + "learning_rate": 2.7761417104898977e-05, + "loss": 0.1316, + "step": 17705 + }, + { + "epoch": 1.73, + "learning_rate": 2.7757265430390258e-05, + "loss": 0.138, + "step": 17710 + }, + { + "epoch": 1.73, + "learning_rate": 2.775311375588154e-05, + "loss": 0.1441, + "step": 17715 + }, + { + "epoch": 1.73, + "learning_rate": 2.774896208137282e-05, + "loss": 0.1308, + "step": 17720 + }, + { + "epoch": 1.73, + "learning_rate": 2.77448104068641e-05, + "loss": 0.1392, + "step": 17725 + }, + { + "epoch": 1.73, + "learning_rate": 2.7740658732355385e-05, + "loss": 0.1792, + "step": 17730 + }, + { + "epoch": 1.73, + "learning_rate": 2.7736507057846665e-05, + "loss": 0.1274, + "step": 17735 + }, + { + "epoch": 1.73, + "learning_rate": 2.773235538333795e-05, + "loss": 0.1482, + "step": 17740 + }, + { + "epoch": 1.74, + "learning_rate": 2.772820370882923e-05, + "loss": 0.1847, + "step": 17745 + }, + { + "epoch": 1.74, + "learning_rate": 2.772405203432051e-05, + "loss": 0.1482, + "step": 17750 + }, + { + "epoch": 1.74, + "learning_rate": 2.7719900359811792e-05, + "loss": 0.1415, + "step": 17755 + }, + { + "epoch": 1.74, + "learning_rate": 2.7715748685303073e-05, + "loss": 0.1646, + "step": 17760 + }, + { + "epoch": 1.74, + "learning_rate": 2.7711597010794353e-05, + "loss": 0.1628, + "step": 17765 + }, + { + "epoch": 1.74, + "learning_rate": 2.7707445336285634e-05, + "loss": 0.1504, + "step": 17770 + }, + { + "epoch": 1.74, + "learning_rate": 2.7703293661776915e-05, + "loss": 0.1405, + "step": 17775 + }, + { + "epoch": 1.74, + "learning_rate": 2.7699141987268196e-05, + "loss": 0.1547, + "step": 17780 + }, + { + "epoch": 1.74, + "learning_rate": 2.7694990312759483e-05, + "loss": 0.1332, + "step": 17785 + }, + { + "epoch": 1.74, + "learning_rate": 2.7690838638250764e-05, + "loss": 0.1336, + "step": 17790 + }, + { + "epoch": 1.74, + "learning_rate": 2.7686686963742045e-05, + "loss": 0.1623, + "step": 17795 + }, + { + "epoch": 1.74, + "learning_rate": 2.7682535289233325e-05, + "loss": 0.135, + "step": 17800 + }, + { + "epoch": 1.74, + "learning_rate": 2.7678383614724606e-05, + "loss": 0.1441, + "step": 17805 + }, + { + "epoch": 1.74, + "learning_rate": 2.7674231940215887e-05, + "loss": 0.1375, + "step": 17810 + }, + { + "epoch": 1.74, + "learning_rate": 2.7670080265707168e-05, + "loss": 0.1767, + "step": 17815 + }, + { + "epoch": 1.74, + "learning_rate": 2.766592859119845e-05, + "loss": 0.1318, + "step": 17820 + }, + { + "epoch": 1.74, + "learning_rate": 2.7661776916689733e-05, + "loss": 0.136, + "step": 17825 + }, + { + "epoch": 1.74, + "learning_rate": 2.7657625242181013e-05, + "loss": 0.1664, + "step": 17830 + }, + { + "epoch": 1.74, + "learning_rate": 2.7653473567672298e-05, + "loss": 0.1315, + "step": 17835 + }, + { + "epoch": 1.74, + "learning_rate": 2.764932189316358e-05, + "loss": 0.1388, + "step": 17840 + }, + { + "epoch": 1.74, + "learning_rate": 2.764517021865486e-05, + "loss": 0.1504, + "step": 17845 + }, + { + "epoch": 1.75, + "learning_rate": 2.764101854414614e-05, + "loss": 0.131, + "step": 17850 + }, + { + "epoch": 1.75, + "learning_rate": 2.763686686963742e-05, + "loss": 0.1343, + "step": 17855 + }, + { + "epoch": 1.75, + "learning_rate": 2.76327151951287e-05, + "loss": 0.1569, + "step": 17860 + }, + { + "epoch": 1.75, + "learning_rate": 2.7628563520619982e-05, + "loss": 0.1607, + "step": 17865 + }, + { + "epoch": 1.75, + "learning_rate": 2.7624411846111266e-05, + "loss": 0.1315, + "step": 17870 + }, + { + "epoch": 1.75, + "learning_rate": 2.7620260171602547e-05, + "loss": 0.163, + "step": 17875 + }, + { + "epoch": 1.75, + "learning_rate": 2.7616108497093828e-05, + "loss": 0.1646, + "step": 17880 + }, + { + "epoch": 1.75, + "learning_rate": 2.7611956822585112e-05, + "loss": 0.1367, + "step": 17885 + }, + { + "epoch": 1.75, + "learning_rate": 2.7607805148076393e-05, + "loss": 0.143, + "step": 17890 + }, + { + "epoch": 1.75, + "learning_rate": 2.7603653473567674e-05, + "loss": 0.1641, + "step": 17895 + }, + { + "epoch": 1.75, + "learning_rate": 2.7599501799058954e-05, + "loss": 0.1363, + "step": 17900 + }, + { + "epoch": 1.75, + "learning_rate": 2.7595350124550235e-05, + "loss": 0.1447, + "step": 17905 + }, + { + "epoch": 1.75, + "learning_rate": 2.7591198450041516e-05, + "loss": 0.1859, + "step": 17910 + }, + { + "epoch": 1.75, + "learning_rate": 2.75870467755328e-05, + "loss": 0.1527, + "step": 17915 + }, + { + "epoch": 1.75, + "learning_rate": 2.758289510102408e-05, + "loss": 0.1223, + "step": 17920 + }, + { + "epoch": 1.75, + "learning_rate": 2.757874342651536e-05, + "loss": 0.1337, + "step": 17925 + }, + { + "epoch": 1.75, + "learning_rate": 2.7574591752006642e-05, + "loss": 0.1646, + "step": 17930 + }, + { + "epoch": 1.75, + "learning_rate": 2.7570440077497923e-05, + "loss": 0.1378, + "step": 17935 + }, + { + "epoch": 1.75, + "learning_rate": 2.7566288402989207e-05, + "loss": 0.1266, + "step": 17940 + }, + { + "epoch": 1.75, + "learning_rate": 2.7562136728480488e-05, + "loss": 0.1457, + "step": 17945 + }, + { + "epoch": 1.76, + "learning_rate": 2.755798505397177e-05, + "loss": 0.1251, + "step": 17950 + }, + { + "epoch": 1.76, + "learning_rate": 2.755383337946305e-05, + "loss": 0.1292, + "step": 17955 + }, + { + "epoch": 1.76, + "learning_rate": 2.7549681704954334e-05, + "loss": 0.184, + "step": 17960 + }, + { + "epoch": 1.76, + "learning_rate": 2.7545530030445615e-05, + "loss": 0.1651, + "step": 17965 + }, + { + "epoch": 1.76, + "learning_rate": 2.7541378355936895e-05, + "loss": 0.1409, + "step": 17970 + }, + { + "epoch": 1.76, + "learning_rate": 2.7537226681428176e-05, + "loss": 0.141, + "step": 17975 + }, + { + "epoch": 1.76, + "learning_rate": 2.7533075006919457e-05, + "loss": 0.1577, + "step": 17980 + }, + { + "epoch": 1.76, + "learning_rate": 2.7528923332410738e-05, + "loss": 0.1378, + "step": 17985 + }, + { + "epoch": 1.76, + "learning_rate": 2.7524771657902022e-05, + "loss": 0.1679, + "step": 17990 + }, + { + "epoch": 1.76, + "learning_rate": 2.7520619983393303e-05, + "loss": 0.152, + "step": 17995 + }, + { + "epoch": 1.76, + "learning_rate": 2.7516468308884583e-05, + "loss": 0.143, + "step": 18000 + }, + { + "epoch": 1.76, + "eval_cer": 0.06502170087705303, + "eval_loss": 0.27048301696777344, + "eval_runtime": 276.7204, + "eval_samples_per_second": 59.157, + "eval_steps_per_second": 1.644, + "eval_wer": 0.16690282938168902, + "step": 18000 + }, + { + "epoch": 1.76, + "learning_rate": 2.7512316634375867e-05, + "loss": 0.1217, + "step": 18005 + }, + { + "epoch": 1.76, + "learning_rate": 2.7508164959867148e-05, + "loss": 0.1326, + "step": 18010 + }, + { + "epoch": 1.76, + "learning_rate": 2.750401328535843e-05, + "loss": 0.1415, + "step": 18015 + }, + { + "epoch": 1.76, + "learning_rate": 2.749986161084971e-05, + "loss": 0.1284, + "step": 18020 + }, + { + "epoch": 1.76, + "learning_rate": 2.749570993634099e-05, + "loss": 0.1377, + "step": 18025 + }, + { + "epoch": 1.76, + "learning_rate": 2.749155826183227e-05, + "loss": 0.1581, + "step": 18030 + }, + { + "epoch": 1.76, + "learning_rate": 2.7487406587323552e-05, + "loss": 0.1349, + "step": 18035 + }, + { + "epoch": 1.76, + "learning_rate": 2.7483254912814836e-05, + "loss": 0.1207, + "step": 18040 + }, + { + "epoch": 1.76, + "learning_rate": 2.747910323830612e-05, + "loss": 0.1741, + "step": 18045 + }, + { + "epoch": 1.76, + "learning_rate": 2.74749515637974e-05, + "loss": 0.1472, + "step": 18050 + }, + { + "epoch": 1.77, + "learning_rate": 2.7470799889288682e-05, + "loss": 0.1252, + "step": 18055 + }, + { + "epoch": 1.77, + "learning_rate": 2.7466648214779963e-05, + "loss": 0.1572, + "step": 18060 + }, + { + "epoch": 1.77, + "learning_rate": 2.7462496540271243e-05, + "loss": 0.1609, + "step": 18065 + }, + { + "epoch": 1.77, + "learning_rate": 2.7458344865762524e-05, + "loss": 0.13, + "step": 18070 + }, + { + "epoch": 1.77, + "learning_rate": 2.7454193191253805e-05, + "loss": 0.1454, + "step": 18075 + }, + { + "epoch": 1.77, + "learning_rate": 2.7450041516745086e-05, + "loss": 0.1798, + "step": 18080 + }, + { + "epoch": 1.77, + "learning_rate": 2.7445889842236367e-05, + "loss": 0.1299, + "step": 18085 + }, + { + "epoch": 1.77, + "learning_rate": 2.7441738167727654e-05, + "loss": 0.1352, + "step": 18090 + }, + { + "epoch": 1.77, + "learning_rate": 2.7437586493218935e-05, + "loss": 0.1603, + "step": 18095 + }, + { + "epoch": 1.77, + "learning_rate": 2.7433434818710216e-05, + "loss": 0.1549, + "step": 18100 + }, + { + "epoch": 1.77, + "learning_rate": 2.7429283144201496e-05, + "loss": 0.1406, + "step": 18105 + }, + { + "epoch": 1.77, + "learning_rate": 2.7425131469692777e-05, + "loss": 0.1741, + "step": 18110 + }, + { + "epoch": 1.77, + "learning_rate": 2.7420979795184058e-05, + "loss": 0.1553, + "step": 18115 + }, + { + "epoch": 1.77, + "learning_rate": 2.741682812067534e-05, + "loss": 0.1421, + "step": 18120 + }, + { + "epoch": 1.77, + "learning_rate": 2.741267644616662e-05, + "loss": 0.1365, + "step": 18125 + }, + { + "epoch": 1.77, + "learning_rate": 2.74085247716579e-05, + "loss": 0.1624, + "step": 18130 + }, + { + "epoch": 1.77, + "learning_rate": 2.7404373097149184e-05, + "loss": 0.1457, + "step": 18135 + }, + { + "epoch": 1.77, + "learning_rate": 2.7400221422640465e-05, + "loss": 0.1327, + "step": 18140 + }, + { + "epoch": 1.77, + "learning_rate": 2.739606974813175e-05, + "loss": 0.1457, + "step": 18145 + }, + { + "epoch": 1.77, + "learning_rate": 2.739191807362303e-05, + "loss": 0.1648, + "step": 18150 + }, + { + "epoch": 1.78, + "learning_rate": 2.738776639911431e-05, + "loss": 0.1474, + "step": 18155 + }, + { + "epoch": 1.78, + "learning_rate": 2.738361472460559e-05, + "loss": 0.1646, + "step": 18160 + }, + { + "epoch": 1.78, + "learning_rate": 2.7379463050096872e-05, + "loss": 0.1567, + "step": 18165 + }, + { + "epoch": 1.78, + "learning_rate": 2.7375311375588153e-05, + "loss": 0.1343, + "step": 18170 + }, + { + "epoch": 1.78, + "learning_rate": 2.7371159701079434e-05, + "loss": 0.1385, + "step": 18175 + }, + { + "epoch": 1.78, + "learning_rate": 2.7367008026570718e-05, + "loss": 0.1564, + "step": 18180 + }, + { + "epoch": 1.78, + "learning_rate": 2.7362856352062e-05, + "loss": 0.1382, + "step": 18185 + }, + { + "epoch": 1.78, + "learning_rate": 2.735870467755328e-05, + "loss": 0.1429, + "step": 18190 + }, + { + "epoch": 1.78, + "learning_rate": 2.7354553003044564e-05, + "loss": 0.1594, + "step": 18195 + }, + { + "epoch": 1.78, + "learning_rate": 2.7350401328535845e-05, + "loss": 0.1592, + "step": 18200 + }, + { + "epoch": 1.78, + "learning_rate": 2.7346249654027125e-05, + "loss": 0.1409, + "step": 18205 + }, + { + "epoch": 1.78, + "learning_rate": 2.7342097979518406e-05, + "loss": 0.128, + "step": 18210 + }, + { + "epoch": 1.78, + "learning_rate": 2.7337946305009687e-05, + "loss": 0.1689, + "step": 18215 + }, + { + "epoch": 1.78, + "learning_rate": 2.7333794630500968e-05, + "loss": 0.1343, + "step": 18220 + }, + { + "epoch": 1.78, + "learning_rate": 2.7329642955992252e-05, + "loss": 0.1354, + "step": 18225 + }, + { + "epoch": 1.78, + "learning_rate": 2.7325491281483533e-05, + "loss": 0.1611, + "step": 18230 + }, + { + "epoch": 1.78, + "learning_rate": 2.7321339606974813e-05, + "loss": 0.1533, + "step": 18235 + }, + { + "epoch": 1.78, + "learning_rate": 2.7317187932466094e-05, + "loss": 0.1302, + "step": 18240 + }, + { + "epoch": 1.78, + "learning_rate": 2.7313036257957378e-05, + "loss": 0.1738, + "step": 18245 + }, + { + "epoch": 1.78, + "learning_rate": 2.730888458344866e-05, + "loss": 0.1318, + "step": 18250 + }, + { + "epoch": 1.79, + "learning_rate": 2.730473290893994e-05, + "loss": 0.1314, + "step": 18255 + }, + { + "epoch": 1.79, + "learning_rate": 2.730058123443122e-05, + "loss": 0.1413, + "step": 18260 + }, + { + "epoch": 1.79, + "learning_rate": 2.72964295599225e-05, + "loss": 0.1553, + "step": 18265 + }, + { + "epoch": 1.79, + "learning_rate": 2.7292277885413785e-05, + "loss": 0.1516, + "step": 18270 + }, + { + "epoch": 1.79, + "learning_rate": 2.7288126210905066e-05, + "loss": 0.1357, + "step": 18275 + }, + { + "epoch": 1.79, + "learning_rate": 2.7283974536396347e-05, + "loss": 0.1694, + "step": 18280 + }, + { + "epoch": 1.79, + "learning_rate": 2.7279822861887628e-05, + "loss": 0.1414, + "step": 18285 + }, + { + "epoch": 1.79, + "learning_rate": 2.727567118737891e-05, + "loss": 0.1277, + "step": 18290 + }, + { + "epoch": 1.79, + "learning_rate": 2.7271519512870193e-05, + "loss": 0.1844, + "step": 18295 + }, + { + "epoch": 1.79, + "learning_rate": 2.7267367838361473e-05, + "loss": 0.1566, + "step": 18300 + }, + { + "epoch": 1.79, + "learning_rate": 2.7263216163852754e-05, + "loss": 0.1307, + "step": 18305 + }, + { + "epoch": 1.79, + "learning_rate": 2.725906448934404e-05, + "loss": 0.1659, + "step": 18310 + }, + { + "epoch": 1.79, + "learning_rate": 2.725491281483532e-05, + "loss": 0.1561, + "step": 18315 + }, + { + "epoch": 1.79, + "learning_rate": 2.72507611403266e-05, + "loss": 0.1329, + "step": 18320 + }, + { + "epoch": 1.79, + "learning_rate": 2.724660946581788e-05, + "loss": 0.144, + "step": 18325 + }, + { + "epoch": 1.79, + "learning_rate": 2.724245779130916e-05, + "loss": 0.1548, + "step": 18330 + }, + { + "epoch": 1.79, + "learning_rate": 2.7238306116800442e-05, + "loss": 0.143, + "step": 18335 + }, + { + "epoch": 1.79, + "learning_rate": 2.7234154442291723e-05, + "loss": 0.1488, + "step": 18340 + }, + { + "epoch": 1.79, + "learning_rate": 2.7230002767783007e-05, + "loss": 0.1715, + "step": 18345 + }, + { + "epoch": 1.79, + "learning_rate": 2.7225851093274288e-05, + "loss": 0.137, + "step": 18350 + }, + { + "epoch": 1.79, + "learning_rate": 2.7221699418765572e-05, + "loss": 0.1378, + "step": 18355 + }, + { + "epoch": 1.8, + "learning_rate": 2.7217547744256853e-05, + "loss": 0.1301, + "step": 18360 + }, + { + "epoch": 1.8, + "learning_rate": 2.7213396069748134e-05, + "loss": 0.1493, + "step": 18365 + }, + { + "epoch": 1.8, + "learning_rate": 2.7209244395239414e-05, + "loss": 0.1442, + "step": 18370 + }, + { + "epoch": 1.8, + "learning_rate": 2.7205092720730695e-05, + "loss": 0.1545, + "step": 18375 + }, + { + "epoch": 1.8, + "learning_rate": 2.7200941046221976e-05, + "loss": 0.1703, + "step": 18380 + }, + { + "epoch": 1.8, + "learning_rate": 2.7196789371713257e-05, + "loss": 0.132, + "step": 18385 + }, + { + "epoch": 1.8, + "learning_rate": 2.7192637697204537e-05, + "loss": 0.1405, + "step": 18390 + }, + { + "epoch": 1.8, + "learning_rate": 2.7188486022695818e-05, + "loss": 0.1671, + "step": 18395 + }, + { + "epoch": 1.8, + "learning_rate": 2.7184334348187106e-05, + "loss": 0.1357, + "step": 18400 + }, + { + "epoch": 1.8, + "learning_rate": 2.7180182673678387e-05, + "loss": 0.1208, + "step": 18405 + }, + { + "epoch": 1.8, + "learning_rate": 2.7176030999169667e-05, + "loss": 0.1565, + "step": 18410 + }, + { + "epoch": 1.8, + "learning_rate": 2.7171879324660948e-05, + "loss": 0.16, + "step": 18415 + }, + { + "epoch": 1.8, + "learning_rate": 2.716772765015223e-05, + "loss": 0.1194, + "step": 18420 + }, + { + "epoch": 1.8, + "learning_rate": 2.716357597564351e-05, + "loss": 0.1219, + "step": 18425 + }, + { + "epoch": 1.8, + "learning_rate": 2.715942430113479e-05, + "loss": 0.154, + "step": 18430 + }, + { + "epoch": 1.8, + "learning_rate": 2.715527262662607e-05, + "loss": 0.1489, + "step": 18435 + }, + { + "epoch": 1.8, + "learning_rate": 2.7151120952117352e-05, + "loss": 0.1378, + "step": 18440 + }, + { + "epoch": 1.8, + "learning_rate": 2.7146969277608636e-05, + "loss": 0.1705, + "step": 18445 + }, + { + "epoch": 1.8, + "learning_rate": 2.714281760309992e-05, + "loss": 0.1289, + "step": 18450 + }, + { + "epoch": 1.8, + "learning_rate": 2.71386659285912e-05, + "loss": 0.127, + "step": 18455 + }, + { + "epoch": 1.81, + "learning_rate": 2.7134514254082482e-05, + "loss": 0.1492, + "step": 18460 + }, + { + "epoch": 1.81, + "learning_rate": 2.7130362579573763e-05, + "loss": 0.1597, + "step": 18465 + }, + { + "epoch": 1.81, + "learning_rate": 2.7126210905065043e-05, + "loss": 0.1365, + "step": 18470 + }, + { + "epoch": 1.81, + "learning_rate": 2.7122059230556324e-05, + "loss": 0.1409, + "step": 18475 + }, + { + "epoch": 1.81, + "learning_rate": 2.7117907556047605e-05, + "loss": 0.162, + "step": 18480 + }, + { + "epoch": 1.81, + "learning_rate": 2.7113755881538886e-05, + "loss": 0.1255, + "step": 18485 + }, + { + "epoch": 1.81, + "learning_rate": 2.710960420703017e-05, + "loss": 0.1451, + "step": 18490 + }, + { + "epoch": 1.81, + "learning_rate": 2.710545253252145e-05, + "loss": 0.1608, + "step": 18495 + }, + { + "epoch": 1.81, + "learning_rate": 2.7101300858012735e-05, + "loss": 0.1505, + "step": 18500 + }, + { + "epoch": 1.81, + "eval_cer": 0.06525293025428294, + "eval_loss": 0.26316332817077637, + "eval_runtime": 278.0286, + "eval_samples_per_second": 58.879, + "eval_steps_per_second": 1.637, + "eval_wer": 0.16865935759388284, + "step": 18500 + }, + { + "epoch": 1.81, + "learning_rate": 2.7097149183504015e-05, + "loss": 0.1347, + "step": 18505 + }, + { + "epoch": 1.81, + "learning_rate": 2.7092997508995296e-05, + "loss": 0.1509, + "step": 18510 + }, + { + "epoch": 1.81, + "learning_rate": 2.7088845834486577e-05, + "loss": 0.1491, + "step": 18515 + }, + { + "epoch": 1.81, + "learning_rate": 2.7084694159977858e-05, + "loss": 0.1515, + "step": 18520 + }, + { + "epoch": 1.81, + "learning_rate": 2.708054248546914e-05, + "loss": 0.1526, + "step": 18525 + }, + { + "epoch": 1.81, + "learning_rate": 2.7076390810960423e-05, + "loss": 0.1664, + "step": 18530 + }, + { + "epoch": 1.81, + "learning_rate": 2.7072239136451703e-05, + "loss": 0.137, + "step": 18535 + }, + { + "epoch": 1.81, + "learning_rate": 2.7068087461942984e-05, + "loss": 0.135, + "step": 18540 + }, + { + "epoch": 1.81, + "learning_rate": 2.7063935787434265e-05, + "loss": 0.1734, + "step": 18545 + }, + { + "epoch": 1.81, + "learning_rate": 2.7059784112925546e-05, + "loss": 0.149, + "step": 18550 + }, + { + "epoch": 1.81, + "learning_rate": 2.705563243841683e-05, + "loss": 0.1386, + "step": 18555 + }, + { + "epoch": 1.81, + "learning_rate": 2.705148076390811e-05, + "loss": 0.1246, + "step": 18560 + }, + { + "epoch": 1.82, + "learning_rate": 2.704732908939939e-05, + "loss": 0.1551, + "step": 18565 + }, + { + "epoch": 1.82, + "learning_rate": 2.7043177414890672e-05, + "loss": 0.1323, + "step": 18570 + }, + { + "epoch": 1.82, + "learning_rate": 2.7039025740381956e-05, + "loss": 0.1445, + "step": 18575 + }, + { + "epoch": 1.82, + "learning_rate": 2.7034874065873237e-05, + "loss": 0.1737, + "step": 18580 + }, + { + "epoch": 1.82, + "learning_rate": 2.7030722391364518e-05, + "loss": 0.1395, + "step": 18585 + }, + { + "epoch": 1.82, + "learning_rate": 2.70265707168558e-05, + "loss": 0.1339, + "step": 18590 + }, + { + "epoch": 1.82, + "learning_rate": 2.702241904234708e-05, + "loss": 0.1849, + "step": 18595 + }, + { + "epoch": 1.82, + "learning_rate": 2.701826736783836e-05, + "loss": 0.1445, + "step": 18600 + }, + { + "epoch": 1.82, + "learning_rate": 2.7014115693329644e-05, + "loss": 0.1451, + "step": 18605 + }, + { + "epoch": 1.82, + "learning_rate": 2.7009964018820925e-05, + "loss": 0.1812, + "step": 18610 + }, + { + "epoch": 1.82, + "learning_rate": 2.7005812344312206e-05, + "loss": 0.1851, + "step": 18615 + }, + { + "epoch": 1.82, + "learning_rate": 2.700166066980349e-05, + "loss": 0.1412, + "step": 18620 + }, + { + "epoch": 1.82, + "learning_rate": 2.699750899529477e-05, + "loss": 0.1532, + "step": 18625 + }, + { + "epoch": 1.82, + "learning_rate": 2.699335732078605e-05, + "loss": 0.1738, + "step": 18630 + }, + { + "epoch": 1.82, + "learning_rate": 2.6989205646277332e-05, + "loss": 0.1383, + "step": 18635 + }, + { + "epoch": 1.82, + "learning_rate": 2.6985053971768613e-05, + "loss": 0.1499, + "step": 18640 + }, + { + "epoch": 1.82, + "learning_rate": 2.6980902297259894e-05, + "loss": 0.1416, + "step": 18645 + }, + { + "epoch": 1.82, + "learning_rate": 2.6976750622751175e-05, + "loss": 0.1372, + "step": 18650 + }, + { + "epoch": 1.82, + "learning_rate": 2.697259894824246e-05, + "loss": 0.1144, + "step": 18655 + }, + { + "epoch": 1.82, + "learning_rate": 2.696844727373374e-05, + "loss": 0.182, + "step": 18660 + }, + { + "epoch": 1.83, + "learning_rate": 2.6964295599225024e-05, + "loss": 0.1488, + "step": 18665 + }, + { + "epoch": 1.83, + "learning_rate": 2.6960143924716305e-05, + "loss": 0.1359, + "step": 18670 + }, + { + "epoch": 1.83, + "learning_rate": 2.6955992250207585e-05, + "loss": 0.1388, + "step": 18675 + }, + { + "epoch": 1.83, + "learning_rate": 2.6951840575698866e-05, + "loss": 0.1878, + "step": 18680 + }, + { + "epoch": 1.83, + "learning_rate": 2.6947688901190147e-05, + "loss": 0.1315, + "step": 18685 + }, + { + "epoch": 1.83, + "learning_rate": 2.6943537226681428e-05, + "loss": 0.1323, + "step": 18690 + }, + { + "epoch": 1.83, + "learning_rate": 2.693938555217271e-05, + "loss": 0.1726, + "step": 18695 + }, + { + "epoch": 1.83, + "learning_rate": 2.693523387766399e-05, + "loss": 0.1298, + "step": 18700 + }, + { + "epoch": 1.83, + "learning_rate": 2.6931082203155273e-05, + "loss": 0.1417, + "step": 18705 + }, + { + "epoch": 1.83, + "learning_rate": 2.6926930528646557e-05, + "loss": 0.1537, + "step": 18710 + }, + { + "epoch": 1.83, + "learning_rate": 2.6922778854137838e-05, + "loss": 0.1433, + "step": 18715 + }, + { + "epoch": 1.83, + "learning_rate": 2.691862717962912e-05, + "loss": 0.1187, + "step": 18720 + }, + { + "epoch": 1.83, + "learning_rate": 2.69144755051204e-05, + "loss": 0.1316, + "step": 18725 + }, + { + "epoch": 1.83, + "learning_rate": 2.691032383061168e-05, + "loss": 0.1569, + "step": 18730 + }, + { + "epoch": 1.83, + "learning_rate": 2.690617215610296e-05, + "loss": 0.1345, + "step": 18735 + }, + { + "epoch": 1.83, + "learning_rate": 2.6902020481594242e-05, + "loss": 0.1318, + "step": 18740 + }, + { + "epoch": 1.83, + "learning_rate": 2.6897868807085523e-05, + "loss": 0.1511, + "step": 18745 + }, + { + "epoch": 1.83, + "learning_rate": 2.6893717132576807e-05, + "loss": 0.1484, + "step": 18750 + }, + { + "epoch": 1.83, + "learning_rate": 2.6889565458068088e-05, + "loss": 0.1383, + "step": 18755 + }, + { + "epoch": 1.83, + "learning_rate": 2.6885413783559372e-05, + "loss": 0.1381, + "step": 18760 + }, + { + "epoch": 1.83, + "learning_rate": 2.6881262109050653e-05, + "loss": 0.1566, + "step": 18765 + }, + { + "epoch": 1.84, + "learning_rate": 2.6877110434541933e-05, + "loss": 0.1437, + "step": 18770 + }, + { + "epoch": 1.84, + "learning_rate": 2.6872958760033214e-05, + "loss": 0.151, + "step": 18775 + }, + { + "epoch": 1.84, + "learning_rate": 2.6868807085524495e-05, + "loss": 0.1869, + "step": 18780 + }, + { + "epoch": 1.84, + "learning_rate": 2.6864655411015776e-05, + "loss": 0.1438, + "step": 18785 + }, + { + "epoch": 1.84, + "learning_rate": 2.6860503736507057e-05, + "loss": 0.1188, + "step": 18790 + }, + { + "epoch": 1.84, + "learning_rate": 2.685635206199834e-05, + "loss": 0.1823, + "step": 18795 + }, + { + "epoch": 1.84, + "learning_rate": 2.685220038748962e-05, + "loss": 0.1422, + "step": 18800 + }, + { + "epoch": 1.84, + "learning_rate": 2.6848048712980902e-05, + "loss": 0.1544, + "step": 18805 + }, + { + "epoch": 1.84, + "learning_rate": 2.6843897038472186e-05, + "loss": 0.16, + "step": 18810 + }, + { + "epoch": 1.84, + "learning_rate": 2.6839745363963467e-05, + "loss": 0.15, + "step": 18815 + }, + { + "epoch": 1.84, + "learning_rate": 2.6835593689454748e-05, + "loss": 0.1574, + "step": 18820 + }, + { + "epoch": 1.84, + "learning_rate": 2.683144201494603e-05, + "loss": 0.1483, + "step": 18825 + }, + { + "epoch": 1.84, + "learning_rate": 2.682729034043731e-05, + "loss": 0.1706, + "step": 18830 + }, + { + "epoch": 1.84, + "learning_rate": 2.682313866592859e-05, + "loss": 0.1337, + "step": 18835 + }, + { + "epoch": 1.84, + "learning_rate": 2.6818986991419874e-05, + "loss": 0.1103, + "step": 18840 + }, + { + "epoch": 1.84, + "learning_rate": 2.6814835316911155e-05, + "loss": 0.161, + "step": 18845 + }, + { + "epoch": 1.84, + "learning_rate": 2.6810683642402436e-05, + "loss": 0.1473, + "step": 18850 + }, + { + "epoch": 1.84, + "learning_rate": 2.6806531967893717e-05, + "loss": 0.113, + "step": 18855 + }, + { + "epoch": 1.84, + "learning_rate": 2.6802380293385e-05, + "loss": 0.1532, + "step": 18860 + }, + { + "epoch": 1.84, + "learning_rate": 2.679822861887628e-05, + "loss": 0.1702, + "step": 18865 + }, + { + "epoch": 1.85, + "learning_rate": 2.6794076944367562e-05, + "loss": 0.1439, + "step": 18870 + }, + { + "epoch": 1.85, + "learning_rate": 2.6789925269858843e-05, + "loss": 0.1355, + "step": 18875 + }, + { + "epoch": 1.85, + "learning_rate": 2.6785773595350124e-05, + "loss": 0.1786, + "step": 18880 + }, + { + "epoch": 1.85, + "learning_rate": 2.6781621920841408e-05, + "loss": 0.1299, + "step": 18885 + }, + { + "epoch": 1.85, + "learning_rate": 2.677747024633269e-05, + "loss": 0.1247, + "step": 18890 + }, + { + "epoch": 1.85, + "learning_rate": 2.677331857182397e-05, + "loss": 0.1524, + "step": 18895 + }, + { + "epoch": 1.85, + "learning_rate": 2.676916689731525e-05, + "loss": 0.1625, + "step": 18900 + }, + { + "epoch": 1.85, + "learning_rate": 2.676501522280653e-05, + "loss": 0.1305, + "step": 18905 + }, + { + "epoch": 1.85, + "learning_rate": 2.6760863548297815e-05, + "loss": 0.1554, + "step": 18910 + }, + { + "epoch": 1.85, + "learning_rate": 2.6756711873789096e-05, + "loss": 0.1565, + "step": 18915 + }, + { + "epoch": 1.85, + "learning_rate": 2.6752560199280377e-05, + "loss": 0.1402, + "step": 18920 + }, + { + "epoch": 1.85, + "learning_rate": 2.6748408524771658e-05, + "loss": 0.1489, + "step": 18925 + }, + { + "epoch": 1.85, + "learning_rate": 2.6744256850262942e-05, + "loss": 0.1715, + "step": 18930 + }, + { + "epoch": 1.85, + "learning_rate": 2.6740105175754223e-05, + "loss": 0.1326, + "step": 18935 + }, + { + "epoch": 1.85, + "learning_rate": 2.6735953501245503e-05, + "loss": 0.1337, + "step": 18940 + }, + { + "epoch": 1.85, + "learning_rate": 2.6731801826736784e-05, + "loss": 0.1589, + "step": 18945 + }, + { + "epoch": 1.85, + "learning_rate": 2.6727650152228065e-05, + "loss": 0.1548, + "step": 18950 + }, + { + "epoch": 1.85, + "learning_rate": 2.6723498477719346e-05, + "loss": 0.1238, + "step": 18955 + }, + { + "epoch": 1.85, + "learning_rate": 2.6719346803210626e-05, + "loss": 0.1367, + "step": 18960 + }, + { + "epoch": 1.85, + "learning_rate": 2.671519512870191e-05, + "loss": 0.1596, + "step": 18965 + }, + { + "epoch": 1.85, + "learning_rate": 2.671104345419319e-05, + "loss": 0.1336, + "step": 18970 + }, + { + "epoch": 1.86, + "learning_rate": 2.6706891779684475e-05, + "loss": 0.1326, + "step": 18975 + }, + { + "epoch": 1.86, + "learning_rate": 2.6702740105175756e-05, + "loss": 0.162, + "step": 18980 + }, + { + "epoch": 1.86, + "learning_rate": 2.6698588430667037e-05, + "loss": 0.1208, + "step": 18985 + }, + { + "epoch": 1.86, + "learning_rate": 2.6694436756158318e-05, + "loss": 0.1322, + "step": 18990 + }, + { + "epoch": 1.86, + "learning_rate": 2.66902850816496e-05, + "loss": 0.1677, + "step": 18995 + }, + { + "epoch": 1.86, + "learning_rate": 2.668613340714088e-05, + "loss": 0.1415, + "step": 19000 + }, + { + "epoch": 1.86, + "eval_cer": 0.0635591750660738, + "eval_loss": 0.26230910420417786, + "eval_runtime": 279.3912, + "eval_samples_per_second": 58.592, + "eval_steps_per_second": 1.629, + "eval_wer": 0.1650810027229452, + "step": 19000 + }, + { + "epoch": 1.86, + "learning_rate": 2.668198173263216e-05, + "loss": 0.1331, + "step": 19005 + }, + { + "epoch": 1.86, + "learning_rate": 2.667783005812344e-05, + "loss": 0.1407, + "step": 19010 + }, + { + "epoch": 1.86, + "learning_rate": 2.667367838361473e-05, + "loss": 0.1543, + "step": 19015 + }, + { + "epoch": 1.86, + "learning_rate": 2.666952670910601e-05, + "loss": 0.1512, + "step": 19020 + }, + { + "epoch": 1.86, + "learning_rate": 2.666537503459729e-05, + "loss": 0.1366, + "step": 19025 + }, + { + "epoch": 1.86, + "learning_rate": 2.666122336008857e-05, + "loss": 0.1679, + "step": 19030 + }, + { + "epoch": 1.86, + "learning_rate": 2.665707168557985e-05, + "loss": 0.1367, + "step": 19035 + }, + { + "epoch": 1.86, + "learning_rate": 2.6652920011071132e-05, + "loss": 0.139, + "step": 19040 + }, + { + "epoch": 1.86, + "learning_rate": 2.6648768336562413e-05, + "loss": 0.1599, + "step": 19045 + }, + { + "epoch": 1.86, + "learning_rate": 2.6644616662053694e-05, + "loss": 0.1355, + "step": 19050 + }, + { + "epoch": 1.86, + "learning_rate": 2.6640464987544975e-05, + "loss": 0.1452, + "step": 19055 + }, + { + "epoch": 1.86, + "learning_rate": 2.663631331303626e-05, + "loss": 0.1632, + "step": 19060 + }, + { + "epoch": 1.86, + "learning_rate": 2.6632161638527543e-05, + "loss": 0.1481, + "step": 19065 + }, + { + "epoch": 1.86, + "learning_rate": 2.6628009964018824e-05, + "loss": 0.1339, + "step": 19070 + }, + { + "epoch": 1.87, + "learning_rate": 2.6623858289510104e-05, + "loss": 0.1414, + "step": 19075 + }, + { + "epoch": 1.87, + "learning_rate": 2.6619706615001385e-05, + "loss": 0.1759, + "step": 19080 + }, + { + "epoch": 1.87, + "learning_rate": 2.6615554940492666e-05, + "loss": 0.1437, + "step": 19085 + }, + { + "epoch": 1.87, + "learning_rate": 2.6611403265983947e-05, + "loss": 0.127, + "step": 19090 + }, + { + "epoch": 1.87, + "learning_rate": 2.6607251591475227e-05, + "loss": 0.1678, + "step": 19095 + }, + { + "epoch": 1.87, + "learning_rate": 2.6603099916966508e-05, + "loss": 0.1413, + "step": 19100 + }, + { + "epoch": 1.87, + "learning_rate": 2.6598948242457792e-05, + "loss": 0.125, + "step": 19105 + }, + { + "epoch": 1.87, + "learning_rate": 2.6594796567949073e-05, + "loss": 0.1419, + "step": 19110 + }, + { + "epoch": 1.87, + "learning_rate": 2.6590644893440357e-05, + "loss": 0.1672, + "step": 19115 + }, + { + "epoch": 1.87, + "learning_rate": 2.6586493218931638e-05, + "loss": 0.1427, + "step": 19120 + }, + { + "epoch": 1.87, + "learning_rate": 2.658234154442292e-05, + "loss": 0.1563, + "step": 19125 + }, + { + "epoch": 1.87, + "learning_rate": 2.65781898699142e-05, + "loss": 0.1726, + "step": 19130 + }, + { + "epoch": 1.87, + "learning_rate": 2.657403819540548e-05, + "loss": 0.1386, + "step": 19135 + }, + { + "epoch": 1.87, + "learning_rate": 2.656988652089676e-05, + "loss": 0.1234, + "step": 19140 + }, + { + "epoch": 1.87, + "learning_rate": 2.6565734846388042e-05, + "loss": 0.1536, + "step": 19145 + }, + { + "epoch": 1.87, + "learning_rate": 2.6561583171879326e-05, + "loss": 0.1369, + "step": 19150 + }, + { + "epoch": 1.87, + "learning_rate": 2.6557431497370607e-05, + "loss": 0.1295, + "step": 19155 + }, + { + "epoch": 1.87, + "learning_rate": 2.6553279822861888e-05, + "loss": 0.1457, + "step": 19160 + }, + { + "epoch": 1.87, + "learning_rate": 2.654912814835317e-05, + "loss": 0.1537, + "step": 19165 + }, + { + "epoch": 1.87, + "learning_rate": 2.6544976473844453e-05, + "loss": 0.1401, + "step": 19170 + }, + { + "epoch": 1.88, + "learning_rate": 2.6540824799335733e-05, + "loss": 0.1444, + "step": 19175 + }, + { + "epoch": 1.88, + "learning_rate": 2.6536673124827014e-05, + "loss": 0.1683, + "step": 19180 + }, + { + "epoch": 1.88, + "learning_rate": 2.6532521450318295e-05, + "loss": 0.1308, + "step": 19185 + }, + { + "epoch": 1.88, + "learning_rate": 2.6528369775809576e-05, + "loss": 0.1391, + "step": 19190 + }, + { + "epoch": 1.88, + "learning_rate": 2.652421810130086e-05, + "loss": 0.1411, + "step": 19195 + }, + { + "epoch": 1.88, + "learning_rate": 2.652006642679214e-05, + "loss": 0.1318, + "step": 19200 + }, + { + "epoch": 1.88, + "learning_rate": 2.651591475228342e-05, + "loss": 0.1363, + "step": 19205 + }, + { + "epoch": 1.88, + "learning_rate": 2.6511763077774702e-05, + "loss": 0.1375, + "step": 19210 + }, + { + "epoch": 1.88, + "learning_rate": 2.6507611403265983e-05, + "loss": 0.1511, + "step": 19215 + }, + { + "epoch": 1.88, + "learning_rate": 2.6503459728757267e-05, + "loss": 0.1381, + "step": 19220 + }, + { + "epoch": 1.88, + "learning_rate": 2.6499308054248548e-05, + "loss": 0.1291, + "step": 19225 + }, + { + "epoch": 1.88, + "learning_rate": 2.649515637973983e-05, + "loss": 0.1514, + "step": 19230 + }, + { + "epoch": 1.88, + "learning_rate": 2.6491004705231113e-05, + "loss": 0.1384, + "step": 19235 + }, + { + "epoch": 1.88, + "learning_rate": 2.6486853030722393e-05, + "loss": 0.1461, + "step": 19240 + }, + { + "epoch": 1.88, + "learning_rate": 2.6482701356213674e-05, + "loss": 0.1567, + "step": 19245 + }, + { + "epoch": 1.88, + "learning_rate": 2.6478549681704955e-05, + "loss": 0.1449, + "step": 19250 + }, + { + "epoch": 1.88, + "learning_rate": 2.6474398007196236e-05, + "loss": 0.1269, + "step": 19255 + }, + { + "epoch": 1.88, + "learning_rate": 2.6470246332687517e-05, + "loss": 0.1488, + "step": 19260 + }, + { + "epoch": 1.88, + "learning_rate": 2.6466094658178797e-05, + "loss": 0.1548, + "step": 19265 + }, + { + "epoch": 1.88, + "learning_rate": 2.646194298367008e-05, + "loss": 0.1295, + "step": 19270 + }, + { + "epoch": 1.88, + "learning_rate": 2.6458621644063106e-05, + "loss": 0.1361, + "step": 19275 + }, + { + "epoch": 1.89, + "learning_rate": 2.6454469969554387e-05, + "loss": 0.162, + "step": 19280 + }, + { + "epoch": 1.89, + "learning_rate": 2.6450318295045668e-05, + "loss": 0.1387, + "step": 19285 + }, + { + "epoch": 1.89, + "learning_rate": 2.6446166620536952e-05, + "loss": 0.1326, + "step": 19290 + }, + { + "epoch": 1.89, + "learning_rate": 2.6442014946028233e-05, + "loss": 0.1624, + "step": 19295 + }, + { + "epoch": 1.89, + "learning_rate": 2.6437863271519513e-05, + "loss": 0.1553, + "step": 19300 + }, + { + "epoch": 1.89, + "learning_rate": 2.6433711597010794e-05, + "loss": 0.1304, + "step": 19305 + }, + { + "epoch": 1.89, + "learning_rate": 2.6429559922502078e-05, + "loss": 0.1795, + "step": 19310 + }, + { + "epoch": 1.89, + "learning_rate": 2.642540824799336e-05, + "loss": 0.1665, + "step": 19315 + }, + { + "epoch": 1.89, + "learning_rate": 2.642125657348464e-05, + "loss": 0.1264, + "step": 19320 + }, + { + "epoch": 1.89, + "learning_rate": 2.641710489897592e-05, + "loss": 0.1432, + "step": 19325 + }, + { + "epoch": 1.89, + "learning_rate": 2.64129532244672e-05, + "loss": 0.1632, + "step": 19330 + }, + { + "epoch": 1.89, + "learning_rate": 2.6408801549958482e-05, + "loss": 0.1363, + "step": 19335 + }, + { + "epoch": 1.89, + "learning_rate": 2.6404649875449763e-05, + "loss": 0.1247, + "step": 19340 + }, + { + "epoch": 1.89, + "learning_rate": 2.6400498200941047e-05, + "loss": 0.155, + "step": 19345 + }, + { + "epoch": 1.89, + "learning_rate": 2.6396346526432328e-05, + "loss": 0.1499, + "step": 19350 + }, + { + "epoch": 1.89, + "learning_rate": 2.6392194851923612e-05, + "loss": 0.1283, + "step": 19355 + }, + { + "epoch": 1.89, + "learning_rate": 2.6388043177414893e-05, + "loss": 0.1658, + "step": 19360 + }, + { + "epoch": 1.89, + "learning_rate": 2.6383891502906173e-05, + "loss": 0.1387, + "step": 19365 + }, + { + "epoch": 1.89, + "learning_rate": 2.6379739828397454e-05, + "loss": 0.1396, + "step": 19370 + }, + { + "epoch": 1.89, + "learning_rate": 2.6375588153888735e-05, + "loss": 0.1191, + "step": 19375 + }, + { + "epoch": 1.9, + "learning_rate": 2.6371436479380016e-05, + "loss": 0.1611, + "step": 19380 + }, + { + "epoch": 1.9, + "learning_rate": 2.6367284804871297e-05, + "loss": 0.1426, + "step": 19385 + }, + { + "epoch": 1.9, + "learning_rate": 2.6363133130362577e-05, + "loss": 0.1338, + "step": 19390 + }, + { + "epoch": 1.9, + "learning_rate": 2.6358981455853865e-05, + "loss": 0.1751, + "step": 19395 + }, + { + "epoch": 1.9, + "learning_rate": 2.6354829781345146e-05, + "loss": 0.1327, + "step": 19400 + }, + { + "epoch": 1.9, + "learning_rate": 2.6350678106836426e-05, + "loss": 0.1432, + "step": 19405 + }, + { + "epoch": 1.9, + "learning_rate": 2.6346526432327707e-05, + "loss": 0.1735, + "step": 19410 + }, + { + "epoch": 1.9, + "learning_rate": 2.6342374757818988e-05, + "loss": 0.1577, + "step": 19415 + }, + { + "epoch": 1.9, + "learning_rate": 2.633822308331027e-05, + "loss": 0.1281, + "step": 19420 + }, + { + "epoch": 1.9, + "learning_rate": 2.633407140880155e-05, + "loss": 0.1233, + "step": 19425 + }, + { + "epoch": 1.9, + "learning_rate": 2.632991973429283e-05, + "loss": 0.1595, + "step": 19430 + }, + { + "epoch": 1.9, + "learning_rate": 2.632576805978411e-05, + "loss": 0.1427, + "step": 19435 + }, + { + "epoch": 1.9, + "learning_rate": 2.6321616385275395e-05, + "loss": 0.1415, + "step": 19440 + }, + { + "epoch": 1.9, + "learning_rate": 2.631746471076668e-05, + "loss": 0.1744, + "step": 19445 + }, + { + "epoch": 1.9, + "learning_rate": 2.631331303625796e-05, + "loss": 0.1484, + "step": 19450 + }, + { + "epoch": 1.9, + "learning_rate": 2.630916136174924e-05, + "loss": 0.1298, + "step": 19455 + }, + { + "epoch": 1.9, + "learning_rate": 2.630500968724052e-05, + "loss": 0.166, + "step": 19460 + }, + { + "epoch": 1.9, + "learning_rate": 2.6300858012731802e-05, + "loss": 0.1461, + "step": 19465 + }, + { + "epoch": 1.9, + "learning_rate": 2.6296706338223083e-05, + "loss": 0.1384, + "step": 19470 + }, + { + "epoch": 1.9, + "learning_rate": 2.6292554663714364e-05, + "loss": 0.1357, + "step": 19475 + }, + { + "epoch": 1.9, + "learning_rate": 2.6288402989205645e-05, + "loss": 0.1791, + "step": 19480 + }, + { + "epoch": 1.91, + "learning_rate": 2.628425131469693e-05, + "loss": 0.1423, + "step": 19485 + }, + { + "epoch": 1.91, + "learning_rate": 2.628009964018821e-05, + "loss": 0.1427, + "step": 19490 + }, + { + "epoch": 1.91, + "learning_rate": 2.6275947965679494e-05, + "loss": 0.1656, + "step": 19495 + }, + { + "epoch": 1.91, + "learning_rate": 2.6271796291170775e-05, + "loss": 0.1402, + "step": 19500 + }, + { + "epoch": 1.91, + "eval_cer": 0.06466676378300511, + "eval_loss": 0.2606678903102875, + "eval_runtime": 279.7722, + "eval_samples_per_second": 58.512, + "eval_steps_per_second": 1.626, + "eval_wer": 0.16681794140117406, + "step": 19500 + }, + { + "epoch": 1.91, + "learning_rate": 2.6267644616662055e-05, + "loss": 0.1523, + "step": 19505 + }, + { + "epoch": 1.91, + "learning_rate": 2.6263492942153336e-05, + "loss": 0.1448, + "step": 19510 + }, + { + "epoch": 1.91, + "learning_rate": 2.6259341267644617e-05, + "loss": 0.1546, + "step": 19515 + }, + { + "epoch": 1.91, + "learning_rate": 2.6255189593135898e-05, + "loss": 0.1431, + "step": 19520 + }, + { + "epoch": 1.91, + "learning_rate": 2.625103791862718e-05, + "loss": 0.128, + "step": 19525 + }, + { + "epoch": 1.91, + "learning_rate": 2.6246886244118463e-05, + "loss": 0.1584, + "step": 19530 + }, + { + "epoch": 1.91, + "learning_rate": 2.6242734569609743e-05, + "loss": 0.1315, + "step": 19535 + }, + { + "epoch": 1.91, + "learning_rate": 2.6238582895101024e-05, + "loss": 0.1321, + "step": 19540 + }, + { + "epoch": 1.91, + "learning_rate": 2.6234431220592305e-05, + "loss": 0.1649, + "step": 19545 + }, + { + "epoch": 1.91, + "learning_rate": 2.623027954608359e-05, + "loss": 0.1507, + "step": 19550 + }, + { + "epoch": 1.91, + "learning_rate": 2.622612787157487e-05, + "loss": 0.1535, + "step": 19555 + }, + { + "epoch": 1.91, + "learning_rate": 2.622197619706615e-05, + "loss": 0.1358, + "step": 19560 + }, + { + "epoch": 1.91, + "learning_rate": 2.621782452255743e-05, + "loss": 0.167, + "step": 19565 + }, + { + "epoch": 1.91, + "learning_rate": 2.6213672848048712e-05, + "loss": 0.1262, + "step": 19570 + }, + { + "epoch": 1.91, + "learning_rate": 2.6209521173539996e-05, + "loss": 0.1514, + "step": 19575 + }, + { + "epoch": 1.91, + "learning_rate": 2.6205369499031277e-05, + "loss": 0.1656, + "step": 19580 + }, + { + "epoch": 1.92, + "learning_rate": 2.6201217824522558e-05, + "loss": 0.1361, + "step": 19585 + }, + { + "epoch": 1.92, + "learning_rate": 2.619706615001384e-05, + "loss": 0.1424, + "step": 19590 + }, + { + "epoch": 1.92, + "learning_rate": 2.619291447550512e-05, + "loss": 0.1394, + "step": 19595 + }, + { + "epoch": 1.92, + "learning_rate": 2.6188762800996403e-05, + "loss": 0.142, + "step": 19600 + }, + { + "epoch": 1.92, + "learning_rate": 2.6184611126487684e-05, + "loss": 0.1252, + "step": 19605 + }, + { + "epoch": 1.92, + "learning_rate": 2.6180459451978965e-05, + "loss": 0.1317, + "step": 19610 + }, + { + "epoch": 1.92, + "learning_rate": 2.617630777747025e-05, + "loss": 0.1459, + "step": 19615 + }, + { + "epoch": 1.92, + "learning_rate": 2.617215610296153e-05, + "loss": 0.1396, + "step": 19620 + }, + { + "epoch": 1.92, + "learning_rate": 2.616800442845281e-05, + "loss": 0.1308, + "step": 19625 + }, + { + "epoch": 1.92, + "learning_rate": 2.616385275394409e-05, + "loss": 0.1491, + "step": 19630 + }, + { + "epoch": 1.92, + "learning_rate": 2.6159701079435372e-05, + "loss": 0.1326, + "step": 19635 + }, + { + "epoch": 1.92, + "learning_rate": 2.6155549404926653e-05, + "loss": 0.1346, + "step": 19640 + }, + { + "epoch": 1.92, + "learning_rate": 2.6151397730417934e-05, + "loss": 0.168, + "step": 19645 + }, + { + "epoch": 1.92, + "learning_rate": 2.6147246055909218e-05, + "loss": 0.1389, + "step": 19650 + }, + { + "epoch": 1.92, + "learning_rate": 2.61430943814005e-05, + "loss": 0.1385, + "step": 19655 + }, + { + "epoch": 1.92, + "learning_rate": 2.6138942706891783e-05, + "loss": 0.1346, + "step": 19660 + }, + { + "epoch": 1.92, + "learning_rate": 2.6134791032383064e-05, + "loss": 0.1433, + "step": 19665 + }, + { + "epoch": 1.92, + "learning_rate": 2.6130639357874344e-05, + "loss": 0.1417, + "step": 19670 + }, + { + "epoch": 1.92, + "learning_rate": 2.6126487683365625e-05, + "loss": 0.1348, + "step": 19675 + }, + { + "epoch": 1.92, + "learning_rate": 2.6122336008856906e-05, + "loss": 0.1676, + "step": 19680 + }, + { + "epoch": 1.92, + "learning_rate": 2.6118184334348187e-05, + "loss": 0.1293, + "step": 19685 + }, + { + "epoch": 1.93, + "learning_rate": 2.6114032659839467e-05, + "loss": 0.1224, + "step": 19690 + }, + { + "epoch": 1.93, + "learning_rate": 2.6109880985330748e-05, + "loss": 0.1463, + "step": 19695 + }, + { + "epoch": 1.93, + "learning_rate": 2.6105729310822032e-05, + "loss": 0.1493, + "step": 19700 + }, + { + "epoch": 1.93, + "learning_rate": 2.6101577636313317e-05, + "loss": 0.1428, + "step": 19705 + }, + { + "epoch": 1.93, + "learning_rate": 2.6097425961804597e-05, + "loss": 0.1421, + "step": 19710 + }, + { + "epoch": 1.93, + "learning_rate": 2.6093274287295878e-05, + "loss": 0.1453, + "step": 19715 + }, + { + "epoch": 1.93, + "learning_rate": 2.608912261278716e-05, + "loss": 0.1318, + "step": 19720 + }, + { + "epoch": 1.93, + "learning_rate": 2.608497093827844e-05, + "loss": 0.1465, + "step": 19725 + }, + { + "epoch": 1.93, + "learning_rate": 2.608081926376972e-05, + "loss": 0.171, + "step": 19730 + }, + { + "epoch": 1.93, + "learning_rate": 2.6076667589261e-05, + "loss": 0.1248, + "step": 19735 + }, + { + "epoch": 1.93, + "learning_rate": 2.6072515914752282e-05, + "loss": 0.1426, + "step": 19740 + }, + { + "epoch": 1.93, + "learning_rate": 2.6068364240243563e-05, + "loss": 0.1414, + "step": 19745 + }, + { + "epoch": 1.93, + "learning_rate": 2.6064212565734847e-05, + "loss": 0.1234, + "step": 19750 + }, + { + "epoch": 1.93, + "learning_rate": 2.606006089122613e-05, + "loss": 0.1324, + "step": 19755 + }, + { + "epoch": 1.93, + "learning_rate": 2.6055909216717412e-05, + "loss": 0.1327, + "step": 19760 + }, + { + "epoch": 1.93, + "learning_rate": 2.6051757542208693e-05, + "loss": 0.1464, + "step": 19765 + }, + { + "epoch": 1.93, + "learning_rate": 2.6047605867699973e-05, + "loss": 0.1261, + "step": 19770 + }, + { + "epoch": 1.93, + "learning_rate": 2.6043454193191254e-05, + "loss": 0.1437, + "step": 19775 + }, + { + "epoch": 1.93, + "learning_rate": 2.6039302518682535e-05, + "loss": 0.1292, + "step": 19780 + }, + { + "epoch": 1.93, + "learning_rate": 2.6035150844173816e-05, + "loss": 0.1373, + "step": 19785 + }, + { + "epoch": 1.94, + "learning_rate": 2.6030999169665096e-05, + "loss": 0.1289, + "step": 19790 + }, + { + "epoch": 1.94, + "learning_rate": 2.602684749515638e-05, + "loss": 0.1595, + "step": 19795 + }, + { + "epoch": 1.94, + "learning_rate": 2.602269582064766e-05, + "loss": 0.1573, + "step": 19800 + }, + { + "epoch": 1.94, + "learning_rate": 2.6018544146138945e-05, + "loss": 0.1279, + "step": 19805 + }, + { + "epoch": 1.94, + "learning_rate": 2.6014392471630226e-05, + "loss": 0.1549, + "step": 19810 + }, + { + "epoch": 1.94, + "learning_rate": 2.6010240797121507e-05, + "loss": 0.1579, + "step": 19815 + }, + { + "epoch": 1.94, + "learning_rate": 2.6006089122612788e-05, + "loss": 0.1156, + "step": 19820 + }, + { + "epoch": 1.94, + "learning_rate": 2.600193744810407e-05, + "loss": 0.1358, + "step": 19825 + }, + { + "epoch": 1.94, + "learning_rate": 2.599778577359535e-05, + "loss": 0.1718, + "step": 19830 + }, + { + "epoch": 1.94, + "learning_rate": 2.5993634099086633e-05, + "loss": 0.1439, + "step": 19835 + }, + { + "epoch": 1.94, + "learning_rate": 2.5989482424577914e-05, + "loss": 0.1431, + "step": 19840 + }, + { + "epoch": 1.94, + "learning_rate": 2.5985330750069195e-05, + "loss": 0.1998, + "step": 19845 + }, + { + "epoch": 1.94, + "learning_rate": 2.5981179075560476e-05, + "loss": 0.1291, + "step": 19850 + }, + { + "epoch": 1.94, + "learning_rate": 2.597702740105176e-05, + "loss": 0.1249, + "step": 19855 + }, + { + "epoch": 1.94, + "learning_rate": 2.597287572654304e-05, + "loss": 0.1366, + "step": 19860 + }, + { + "epoch": 1.94, + "learning_rate": 2.596872405203432e-05, + "loss": 0.1468, + "step": 19865 + }, + { + "epoch": 1.94, + "learning_rate": 2.5964572377525602e-05, + "loss": 0.1402, + "step": 19870 + }, + { + "epoch": 1.94, + "learning_rate": 2.5960420703016883e-05, + "loss": 0.1493, + "step": 19875 + }, + { + "epoch": 1.94, + "learning_rate": 2.5956269028508167e-05, + "loss": 0.1745, + "step": 19880 + }, + { + "epoch": 1.94, + "learning_rate": 2.5952117353999448e-05, + "loss": 0.1306, + "step": 19885 + }, + { + "epoch": 1.94, + "learning_rate": 2.594796567949073e-05, + "loss": 0.1245, + "step": 19890 + }, + { + "epoch": 1.95, + "learning_rate": 2.594381400498201e-05, + "loss": 0.1557, + "step": 19895 + }, + { + "epoch": 1.95, + "learning_rate": 2.593966233047329e-05, + "loss": 0.1296, + "step": 19900 + }, + { + "epoch": 1.95, + "learning_rate": 2.5935510655964574e-05, + "loss": 0.1238, + "step": 19905 + }, + { + "epoch": 1.95, + "learning_rate": 2.5931358981455855e-05, + "loss": 0.1562, + "step": 19910 + }, + { + "epoch": 1.95, + "learning_rate": 2.5927207306947136e-05, + "loss": 0.1681, + "step": 19915 + }, + { + "epoch": 1.95, + "learning_rate": 2.5923055632438417e-05, + "loss": 0.1282, + "step": 19920 + }, + { + "epoch": 1.95, + "learning_rate": 2.59189039579297e-05, + "loss": 0.124, + "step": 19925 + }, + { + "epoch": 1.95, + "learning_rate": 2.591475228342098e-05, + "loss": 0.1507, + "step": 19930 + }, + { + "epoch": 1.95, + "learning_rate": 2.5910600608912262e-05, + "loss": 0.1294, + "step": 19935 + }, + { + "epoch": 1.95, + "learning_rate": 2.5906448934403543e-05, + "loss": 0.1573, + "step": 19940 + }, + { + "epoch": 1.95, + "learning_rate": 2.5902297259894824e-05, + "loss": 0.167, + "step": 19945 + }, + { + "epoch": 1.95, + "learning_rate": 2.5898145585386105e-05, + "loss": 0.1258, + "step": 19950 + }, + { + "epoch": 1.95, + "learning_rate": 2.5893993910877385e-05, + "loss": 0.1299, + "step": 19955 + }, + { + "epoch": 1.95, + "learning_rate": 2.588984223636867e-05, + "loss": 0.1381, + "step": 19960 + }, + { + "epoch": 1.95, + "learning_rate": 2.588569056185995e-05, + "loss": 0.1561, + "step": 19965 + }, + { + "epoch": 1.95, + "learning_rate": 2.5881538887351235e-05, + "loss": 0.1449, + "step": 19970 + }, + { + "epoch": 1.95, + "learning_rate": 2.5877387212842515e-05, + "loss": 0.1229, + "step": 19975 + }, + { + "epoch": 1.95, + "learning_rate": 2.5873235538333796e-05, + "loss": 0.1775, + "step": 19980 + }, + { + "epoch": 1.95, + "learning_rate": 2.5869083863825077e-05, + "loss": 0.1389, + "step": 19985 + }, + { + "epoch": 1.95, + "learning_rate": 2.5864932189316358e-05, + "loss": 0.1415, + "step": 19990 + }, + { + "epoch": 1.96, + "learning_rate": 2.586078051480764e-05, + "loss": 0.1516, + "step": 19995 + }, + { + "epoch": 1.96, + "learning_rate": 2.585662884029892e-05, + "loss": 0.1354, + "step": 20000 + }, + { + "epoch": 1.96, + "eval_cer": 0.0635499258909846, + "eval_loss": 0.26492738723754883, + "eval_runtime": 285.6634, + "eval_samples_per_second": 57.305, + "eval_steps_per_second": 1.593, + "eval_wer": 0.16429742136434575, + "step": 20000 + }, + { + "epoch": 1.96, + "learning_rate": 2.58524771657902e-05, + "loss": 0.1184, + "step": 20005 + }, + { + "epoch": 1.96, + "learning_rate": 2.5848325491281484e-05, + "loss": 0.1474, + "step": 20010 + }, + { + "epoch": 1.96, + "learning_rate": 2.5844173816772768e-05, + "loss": 0.1538, + "step": 20015 + }, + { + "epoch": 1.96, + "learning_rate": 2.584002214226405e-05, + "loss": 0.1321, + "step": 20020 + }, + { + "epoch": 1.96, + "learning_rate": 2.583587046775533e-05, + "loss": 0.1271, + "step": 20025 + }, + { + "epoch": 1.96, + "learning_rate": 2.583171879324661e-05, + "loss": 0.1823, + "step": 20030 + }, + { + "epoch": 1.96, + "learning_rate": 2.582756711873789e-05, + "loss": 0.1212, + "step": 20035 + }, + { + "epoch": 1.96, + "learning_rate": 2.5823415444229172e-05, + "loss": 0.1335, + "step": 20040 + }, + { + "epoch": 1.96, + "learning_rate": 2.5819263769720453e-05, + "loss": 0.1716, + "step": 20045 + }, + { + "epoch": 1.96, + "learning_rate": 2.5815112095211734e-05, + "loss": 0.1295, + "step": 20050 + }, + { + "epoch": 1.96, + "learning_rate": 2.5810960420703018e-05, + "loss": 0.14, + "step": 20055 + }, + { + "epoch": 1.96, + "learning_rate": 2.5806808746194302e-05, + "loss": 0.1556, + "step": 20060 + }, + { + "epoch": 1.96, + "learning_rate": 2.5802657071685583e-05, + "loss": 0.1492, + "step": 20065 + }, + { + "epoch": 1.96, + "learning_rate": 2.5798505397176863e-05, + "loss": 0.1205, + "step": 20070 + }, + { + "epoch": 1.96, + "learning_rate": 2.5794353722668144e-05, + "loss": 0.1509, + "step": 20075 + }, + { + "epoch": 1.96, + "learning_rate": 2.5790202048159425e-05, + "loss": 0.1643, + "step": 20080 + }, + { + "epoch": 1.96, + "learning_rate": 2.5786050373650706e-05, + "loss": 0.1288, + "step": 20085 + }, + { + "epoch": 1.96, + "learning_rate": 2.5781898699141986e-05, + "loss": 0.1364, + "step": 20090 + }, + { + "epoch": 1.96, + "learning_rate": 2.5777747024633267e-05, + "loss": 0.1657, + "step": 20095 + }, + { + "epoch": 1.97, + "learning_rate": 2.577359535012455e-05, + "loss": 0.1288, + "step": 20100 + }, + { + "epoch": 1.97, + "learning_rate": 2.5769443675615832e-05, + "loss": 0.1262, + "step": 20105 + }, + { + "epoch": 1.97, + "learning_rate": 2.5765292001107116e-05, + "loss": 0.1397, + "step": 20110 + }, + { + "epoch": 1.97, + "learning_rate": 2.5761140326598397e-05, + "loss": 0.1511, + "step": 20115 + }, + { + "epoch": 1.97, + "learning_rate": 2.5756988652089678e-05, + "loss": 0.1281, + "step": 20120 + }, + { + "epoch": 1.97, + "learning_rate": 2.575283697758096e-05, + "loss": 0.1354, + "step": 20125 + }, + { + "epoch": 1.97, + "learning_rate": 2.574868530307224e-05, + "loss": 0.1635, + "step": 20130 + }, + { + "epoch": 1.97, + "learning_rate": 2.574453362856352e-05, + "loss": 0.1364, + "step": 20135 + }, + { + "epoch": 1.97, + "learning_rate": 2.57403819540548e-05, + "loss": 0.1271, + "step": 20140 + }, + { + "epoch": 1.97, + "learning_rate": 2.5736230279546085e-05, + "loss": 0.1616, + "step": 20145 + }, + { + "epoch": 1.97, + "learning_rate": 2.5732078605037366e-05, + "loss": 0.1298, + "step": 20150 + }, + { + "epoch": 1.97, + "learning_rate": 2.572875726543039e-05, + "loss": 0.1476, + "step": 20155 + }, + { + "epoch": 1.97, + "learning_rate": 2.572460559092167e-05, + "loss": 0.1439, + "step": 20160 + }, + { + "epoch": 1.97, + "learning_rate": 2.5720453916412952e-05, + "loss": 0.1525, + "step": 20165 + }, + { + "epoch": 1.97, + "learning_rate": 2.5716302241904233e-05, + "loss": 0.1232, + "step": 20170 + }, + { + "epoch": 1.97, + "learning_rate": 2.5712150567395517e-05, + "loss": 0.1413, + "step": 20175 + }, + { + "epoch": 1.97, + "learning_rate": 2.5707998892886798e-05, + "loss": 0.1722, + "step": 20180 + }, + { + "epoch": 1.97, + "learning_rate": 2.5703847218378082e-05, + "loss": 0.138, + "step": 20185 + }, + { + "epoch": 1.97, + "learning_rate": 2.5699695543869363e-05, + "loss": 0.1283, + "step": 20190 + }, + { + "epoch": 1.97, + "learning_rate": 2.5695543869360643e-05, + "loss": 0.1418, + "step": 20195 + }, + { + "epoch": 1.98, + "learning_rate": 2.5691392194851924e-05, + "loss": 0.147, + "step": 20200 + }, + { + "epoch": 1.98, + "learning_rate": 2.5687240520343205e-05, + "loss": 0.1227, + "step": 20205 + }, + { + "epoch": 1.98, + "learning_rate": 2.5683088845834486e-05, + "loss": 0.1555, + "step": 20210 + }, + { + "epoch": 1.98, + "learning_rate": 2.567893717132577e-05, + "loss": 0.1538, + "step": 20215 + }, + { + "epoch": 1.98, + "learning_rate": 2.567478549681705e-05, + "loss": 0.127, + "step": 20220 + }, + { + "epoch": 1.98, + "learning_rate": 2.567063382230833e-05, + "loss": 0.1118, + "step": 20225 + }, + { + "epoch": 1.98, + "learning_rate": 2.5666482147799612e-05, + "loss": 0.1669, + "step": 20230 + }, + { + "epoch": 1.98, + "learning_rate": 2.5662330473290896e-05, + "loss": 0.1297, + "step": 20235 + }, + { + "epoch": 1.98, + "learning_rate": 2.5658178798782177e-05, + "loss": 0.1572, + "step": 20240 + }, + { + "epoch": 1.98, + "learning_rate": 2.5654027124273458e-05, + "loss": 0.1669, + "step": 20245 + }, + { + "epoch": 1.98, + "learning_rate": 2.564987544976474e-05, + "loss": 0.138, + "step": 20250 + }, + { + "epoch": 1.98, + "learning_rate": 2.564572377525602e-05, + "loss": 0.1497, + "step": 20255 + }, + { + "epoch": 1.98, + "learning_rate": 2.5641572100747304e-05, + "loss": 0.1494, + "step": 20260 + }, + { + "epoch": 1.98, + "learning_rate": 2.5637420426238584e-05, + "loss": 0.1608, + "step": 20265 + }, + { + "epoch": 1.98, + "learning_rate": 2.5633268751729865e-05, + "loss": 0.1135, + "step": 20270 + }, + { + "epoch": 1.98, + "learning_rate": 2.5629117077221146e-05, + "loss": 0.1456, + "step": 20275 + }, + { + "epoch": 1.98, + "learning_rate": 2.5624965402712427e-05, + "loss": 0.1586, + "step": 20280 + }, + { + "epoch": 1.98, + "learning_rate": 2.562081372820371e-05, + "loss": 0.1433, + "step": 20285 + }, + { + "epoch": 1.98, + "learning_rate": 2.561666205369499e-05, + "loss": 0.1258, + "step": 20290 + }, + { + "epoch": 1.98, + "learning_rate": 2.5612510379186272e-05, + "loss": 0.1373, + "step": 20295 + }, + { + "epoch": 1.99, + "learning_rate": 2.5608358704677553e-05, + "loss": 0.1345, + "step": 20300 + }, + { + "epoch": 1.99, + "learning_rate": 2.5604207030168837e-05, + "loss": 0.1299, + "step": 20305 + }, + { + "epoch": 1.99, + "learning_rate": 2.5600055355660118e-05, + "loss": 0.1314, + "step": 20310 + }, + { + "epoch": 1.99, + "learning_rate": 2.55959036811514e-05, + "loss": 0.136, + "step": 20315 + }, + { + "epoch": 1.99, + "learning_rate": 2.559175200664268e-05, + "loss": 0.1477, + "step": 20320 + }, + { + "epoch": 1.99, + "learning_rate": 2.558760033213396e-05, + "loss": 0.1291, + "step": 20325 + }, + { + "epoch": 1.99, + "learning_rate": 2.558344865762524e-05, + "loss": 0.1639, + "step": 20330 + }, + { + "epoch": 1.99, + "learning_rate": 2.5579296983116522e-05, + "loss": 0.125, + "step": 20335 + }, + { + "epoch": 1.99, + "learning_rate": 2.5575145308607806e-05, + "loss": 0.1259, + "step": 20340 + }, + { + "epoch": 1.99, + "learning_rate": 2.5570993634099087e-05, + "loss": 0.1668, + "step": 20345 + }, + { + "epoch": 1.99, + "learning_rate": 2.556684195959037e-05, + "loss": 0.1403, + "step": 20350 + }, + { + "epoch": 1.99, + "learning_rate": 2.5562690285081652e-05, + "loss": 0.1208, + "step": 20355 + }, + { + "epoch": 1.99, + "learning_rate": 2.5558538610572932e-05, + "loss": 0.1456, + "step": 20360 + }, + { + "epoch": 1.99, + "learning_rate": 2.5554386936064213e-05, + "loss": 0.1559, + "step": 20365 + }, + { + "epoch": 1.99, + "learning_rate": 2.5550235261555494e-05, + "loss": 0.1358, + "step": 20370 + }, + { + "epoch": 1.99, + "learning_rate": 2.5546083587046775e-05, + "loss": 0.1506, + "step": 20375 + }, + { + "epoch": 1.99, + "learning_rate": 2.5541931912538056e-05, + "loss": 0.1572, + "step": 20380 + }, + { + "epoch": 1.99, + "learning_rate": 2.5537780238029336e-05, + "loss": 0.1315, + "step": 20385 + }, + { + "epoch": 1.99, + "learning_rate": 2.553362856352062e-05, + "loss": 0.1123, + "step": 20390 + }, + { + "epoch": 1.99, + "learning_rate": 2.5529476889011905e-05, + "loss": 0.1521, + "step": 20395 + }, + { + "epoch": 1.99, + "learning_rate": 2.5525325214503185e-05, + "loss": 0.1276, + "step": 20400 + }, + { + "epoch": 2.0, + "learning_rate": 2.5521173539994466e-05, + "loss": 0.1385, + "step": 20405 + }, + { + "epoch": 2.0, + "learning_rate": 2.5517021865485747e-05, + "loss": 0.1219, + "step": 20410 + }, + { + "epoch": 2.0, + "learning_rate": 2.5512870190977028e-05, + "loss": 0.155, + "step": 20415 + }, + { + "epoch": 2.0, + "learning_rate": 2.550871851646831e-05, + "loss": 0.1328, + "step": 20420 + }, + { + "epoch": 2.0, + "learning_rate": 2.550456684195959e-05, + "loss": 0.1292, + "step": 20425 + }, + { + "epoch": 2.0, + "learning_rate": 2.550041516745087e-05, + "loss": 0.1696, + "step": 20430 + }, + { + "epoch": 2.0, + "learning_rate": 2.5496263492942154e-05, + "loss": 0.136, + "step": 20435 + }, + { + "epoch": 2.0, + "learning_rate": 2.549211181843344e-05, + "loss": 0.1491, + "step": 20440 + }, + { + "epoch": 2.0, + "learning_rate": 2.548796014392472e-05, + "loss": 0.1489, + "step": 20445 + }, + { + "epoch": 2.0, + "learning_rate": 2.5483808469416e-05, + "loss": 0.144, + "step": 20450 + }, + { + "epoch": 2.0, + "learning_rate": 2.547965679490728e-05, + "loss": 0.1528, + "step": 20455 + }, + { + "epoch": 2.0, + "learning_rate": 2.547550512039856e-05, + "loss": 0.1459, + "step": 20460 + }, + { + "epoch": 2.0, + "learning_rate": 2.5471353445889842e-05, + "loss": 0.1237, + "step": 20465 + }, + { + "epoch": 2.0, + "learning_rate": 2.5467201771381123e-05, + "loss": 0.1386, + "step": 20470 + }, + { + "epoch": 2.0, + "learning_rate": 2.5463050096872404e-05, + "loss": 0.1445, + "step": 20475 + }, + { + "epoch": 2.0, + "learning_rate": 2.5458898422363688e-05, + "loss": 0.1231, + "step": 20480 + }, + { + "epoch": 2.0, + "learning_rate": 2.545474674785497e-05, + "loss": 0.1226, + "step": 20485 + }, + { + "epoch": 2.0, + "learning_rate": 2.5450595073346253e-05, + "loss": 0.1424, + "step": 20490 + }, + { + "epoch": 2.0, + "learning_rate": 2.5446443398837534e-05, + "loss": 0.1165, + "step": 20495 + }, + { + "epoch": 2.0, + "learning_rate": 2.5442291724328814e-05, + "loss": 0.1234, + "step": 20500 + }, + { + "epoch": 2.0, + "eval_cer": 0.06356495580050454, + "eval_loss": 0.2684183716773987, + "eval_runtime": 277.269, + "eval_samples_per_second": 59.04, + "eval_steps_per_second": 1.641, + "eval_wer": 0.16158100598786754, + "step": 20500 + }, + { + "epoch": 2.01, + "learning_rate": 2.5438140049820095e-05, + "loss": 0.1451, + "step": 20505 + }, + { + "epoch": 2.01, + "learning_rate": 2.5433988375311376e-05, + "loss": 0.125, + "step": 20510 + }, + { + "epoch": 2.01, + "learning_rate": 2.5429836700802657e-05, + "loss": 0.126, + "step": 20515 + }, + { + "epoch": 2.01, + "learning_rate": 2.5425685026293937e-05, + "loss": 0.1321, + "step": 20520 + }, + { + "epoch": 2.01, + "learning_rate": 2.542153335178522e-05, + "loss": 0.1403, + "step": 20525 + }, + { + "epoch": 2.01, + "learning_rate": 2.5417381677276502e-05, + "loss": 0.1261, + "step": 20530 + }, + { + "epoch": 2.01, + "learning_rate": 2.5413230002767783e-05, + "loss": 0.1244, + "step": 20535 + }, + { + "epoch": 2.01, + "learning_rate": 2.5409078328259064e-05, + "loss": 0.1539, + "step": 20540 + }, + { + "epoch": 2.01, + "learning_rate": 2.5404926653750348e-05, + "loss": 0.1341, + "step": 20545 + }, + { + "epoch": 2.01, + "learning_rate": 2.540077497924163e-05, + "loss": 0.1185, + "step": 20550 + }, + { + "epoch": 2.01, + "learning_rate": 2.539662330473291e-05, + "loss": 0.1322, + "step": 20555 + }, + { + "epoch": 2.01, + "learning_rate": 2.539247163022419e-05, + "loss": 0.1124, + "step": 20560 + }, + { + "epoch": 2.01, + "learning_rate": 2.538831995571547e-05, + "loss": 0.1172, + "step": 20565 + }, + { + "epoch": 2.01, + "learning_rate": 2.5384168281206755e-05, + "loss": 0.1564, + "step": 20570 + }, + { + "epoch": 2.01, + "learning_rate": 2.5380016606698036e-05, + "loss": 0.1401, + "step": 20575 + }, + { + "epoch": 2.01, + "learning_rate": 2.5375864932189317e-05, + "loss": 0.1116, + "step": 20580 + }, + { + "epoch": 2.01, + "learning_rate": 2.5371713257680598e-05, + "loss": 0.1224, + "step": 20585 + }, + { + "epoch": 2.01, + "learning_rate": 2.536756158317188e-05, + "loss": 0.1502, + "step": 20590 + }, + { + "epoch": 2.01, + "learning_rate": 2.5363409908663162e-05, + "loss": 0.1299, + "step": 20595 + }, + { + "epoch": 2.01, + "learning_rate": 2.5359258234154443e-05, + "loss": 0.1171, + "step": 20600 + }, + { + "epoch": 2.01, + "learning_rate": 2.5355106559645724e-05, + "loss": 0.1484, + "step": 20605 + }, + { + "epoch": 2.02, + "learning_rate": 2.5350954885137005e-05, + "loss": 0.1203, + "step": 20610 + }, + { + "epoch": 2.02, + "learning_rate": 2.534680321062829e-05, + "loss": 0.1228, + "step": 20615 + }, + { + "epoch": 2.02, + "learning_rate": 2.534265153611957e-05, + "loss": 0.1262, + "step": 20620 + }, + { + "epoch": 2.02, + "learning_rate": 2.533849986161085e-05, + "loss": 0.1304, + "step": 20625 + }, + { + "epoch": 2.02, + "learning_rate": 2.533434818710213e-05, + "loss": 0.1215, + "step": 20630 + }, + { + "epoch": 2.02, + "learning_rate": 2.5330196512593412e-05, + "loss": 0.1348, + "step": 20635 + }, + { + "epoch": 2.02, + "learning_rate": 2.5326044838084693e-05, + "loss": 0.1843, + "step": 20640 + }, + { + "epoch": 2.02, + "learning_rate": 2.5321893163575977e-05, + "loss": 0.1349, + "step": 20645 + }, + { + "epoch": 2.02, + "learning_rate": 2.5317741489067258e-05, + "loss": 0.1364, + "step": 20650 + }, + { + "epoch": 2.02, + "learning_rate": 2.531358981455854e-05, + "loss": 0.1483, + "step": 20655 + }, + { + "epoch": 2.02, + "learning_rate": 2.5309438140049823e-05, + "loss": 0.121, + "step": 20660 + }, + { + "epoch": 2.02, + "learning_rate": 2.5305286465541103e-05, + "loss": 0.1287, + "step": 20665 + }, + { + "epoch": 2.02, + "learning_rate": 2.5301134791032384e-05, + "loss": 0.1379, + "step": 20670 + }, + { + "epoch": 2.02, + "learning_rate": 2.5296983116523665e-05, + "loss": 0.1455, + "step": 20675 + }, + { + "epoch": 2.02, + "learning_rate": 2.5292831442014946e-05, + "loss": 0.1233, + "step": 20680 + }, + { + "epoch": 2.02, + "learning_rate": 2.5288679767506226e-05, + "loss": 0.1316, + "step": 20685 + }, + { + "epoch": 2.02, + "learning_rate": 2.5284528092997507e-05, + "loss": 0.1367, + "step": 20690 + }, + { + "epoch": 2.02, + "learning_rate": 2.528037641848879e-05, + "loss": 0.1292, + "step": 20695 + }, + { + "epoch": 2.02, + "learning_rate": 2.5276224743980076e-05, + "loss": 0.123, + "step": 20700 + }, + { + "epoch": 2.02, + "learning_rate": 2.5272073069471356e-05, + "loss": 0.1368, + "step": 20705 + }, + { + "epoch": 2.03, + "learning_rate": 2.5267921394962637e-05, + "loss": 0.1418, + "step": 20710 + }, + { + "epoch": 2.03, + "learning_rate": 2.5263769720453918e-05, + "loss": 0.1224, + "step": 20715 + }, + { + "epoch": 2.03, + "learning_rate": 2.52596180459452e-05, + "loss": 0.1479, + "step": 20720 + }, + { + "epoch": 2.03, + "learning_rate": 2.525546637143648e-05, + "loss": 0.1474, + "step": 20725 + }, + { + "epoch": 2.03, + "learning_rate": 2.525131469692776e-05, + "loss": 0.1273, + "step": 20730 + }, + { + "epoch": 2.03, + "learning_rate": 2.524716302241904e-05, + "loss": 0.1179, + "step": 20735 + }, + { + "epoch": 2.03, + "learning_rate": 2.5243011347910322e-05, + "loss": 0.1443, + "step": 20740 + }, + { + "epoch": 2.03, + "learning_rate": 2.5238859673401606e-05, + "loss": 0.1245, + "step": 20745 + }, + { + "epoch": 2.03, + "learning_rate": 2.523470799889289e-05, + "loss": 0.1268, + "step": 20750 + }, + { + "epoch": 2.03, + "learning_rate": 2.523055632438417e-05, + "loss": 0.1607, + "step": 20755 + }, + { + "epoch": 2.03, + "learning_rate": 2.522640464987545e-05, + "loss": 0.1332, + "step": 20760 + }, + { + "epoch": 2.03, + "learning_rate": 2.5222252975366732e-05, + "loss": 0.1137, + "step": 20765 + }, + { + "epoch": 2.03, + "learning_rate": 2.5218101300858013e-05, + "loss": 0.124, + "step": 20770 + }, + { + "epoch": 2.03, + "learning_rate": 2.5213949626349294e-05, + "loss": 0.1493, + "step": 20775 + }, + { + "epoch": 2.03, + "learning_rate": 2.5209797951840575e-05, + "loss": 0.1235, + "step": 20780 + }, + { + "epoch": 2.03, + "learning_rate": 2.5205646277331855e-05, + "loss": 0.1151, + "step": 20785 + }, + { + "epoch": 2.03, + "learning_rate": 2.520149460282314e-05, + "loss": 0.1466, + "step": 20790 + }, + { + "epoch": 2.03, + "learning_rate": 2.519734292831442e-05, + "loss": 0.1152, + "step": 20795 + }, + { + "epoch": 2.03, + "learning_rate": 2.5193191253805704e-05, + "loss": 0.1182, + "step": 20800 + }, + { + "epoch": 2.03, + "learning_rate": 2.5189039579296985e-05, + "loss": 0.1394, + "step": 20805 + }, + { + "epoch": 2.03, + "learning_rate": 2.5184887904788266e-05, + "loss": 0.1315, + "step": 20810 + }, + { + "epoch": 2.04, + "learning_rate": 2.5180736230279547e-05, + "loss": 0.129, + "step": 20815 + }, + { + "epoch": 2.04, + "learning_rate": 2.5176584555770828e-05, + "loss": 0.1396, + "step": 20820 + }, + { + "epoch": 2.04, + "learning_rate": 2.517243288126211e-05, + "loss": 0.137, + "step": 20825 + }, + { + "epoch": 2.04, + "learning_rate": 2.516828120675339e-05, + "loss": 0.119, + "step": 20830 + }, + { + "epoch": 2.04, + "learning_rate": 2.5164129532244673e-05, + "loss": 0.1109, + "step": 20835 + }, + { + "epoch": 2.04, + "learning_rate": 2.5159977857735954e-05, + "loss": 0.1359, + "step": 20840 + }, + { + "epoch": 2.04, + "learning_rate": 2.5155826183227235e-05, + "loss": 0.1414, + "step": 20845 + }, + { + "epoch": 2.04, + "learning_rate": 2.515167450871852e-05, + "loss": 0.1093, + "step": 20850 + }, + { + "epoch": 2.04, + "learning_rate": 2.51475228342098e-05, + "loss": 0.1358, + "step": 20855 + }, + { + "epoch": 2.04, + "learning_rate": 2.514337115970108e-05, + "loss": 0.1399, + "step": 20860 + }, + { + "epoch": 2.04, + "learning_rate": 2.513921948519236e-05, + "loss": 0.135, + "step": 20865 + }, + { + "epoch": 2.04, + "learning_rate": 2.5135067810683642e-05, + "loss": 0.137, + "step": 20870 + }, + { + "epoch": 2.04, + "learning_rate": 2.5130916136174923e-05, + "loss": 0.1421, + "step": 20875 + }, + { + "epoch": 2.04, + "learning_rate": 2.5126764461666207e-05, + "loss": 0.1299, + "step": 20880 + }, + { + "epoch": 2.04, + "learning_rate": 2.5122612787157488e-05, + "loss": 0.1262, + "step": 20885 + }, + { + "epoch": 2.04, + "learning_rate": 2.511846111264877e-05, + "loss": 0.152, + "step": 20890 + }, + { + "epoch": 2.04, + "learning_rate": 2.511430943814005e-05, + "loss": 0.116, + "step": 20895 + }, + { + "epoch": 2.04, + "learning_rate": 2.5110157763631333e-05, + "loss": 0.124, + "step": 20900 + }, + { + "epoch": 2.04, + "learning_rate": 2.5106006089122614e-05, + "loss": 0.1486, + "step": 20905 + }, + { + "epoch": 2.04, + "learning_rate": 2.5101854414613895e-05, + "loss": 0.1528, + "step": 20910 + }, + { + "epoch": 2.05, + "learning_rate": 2.5097702740105176e-05, + "loss": 0.1125, + "step": 20915 + }, + { + "epoch": 2.05, + "learning_rate": 2.509355106559646e-05, + "loss": 0.1374, + "step": 20920 + }, + { + "epoch": 2.05, + "learning_rate": 2.508939939108774e-05, + "loss": 0.1356, + "step": 20925 + }, + { + "epoch": 2.05, + "learning_rate": 2.508524771657902e-05, + "loss": 0.1168, + "step": 20930 + }, + { + "epoch": 2.05, + "learning_rate": 2.5081096042070302e-05, + "loss": 0.1138, + "step": 20935 + }, + { + "epoch": 2.05, + "learning_rate": 2.5076944367561583e-05, + "loss": 0.1715, + "step": 20940 + }, + { + "epoch": 2.05, + "learning_rate": 2.5072792693052864e-05, + "loss": 0.1129, + "step": 20945 + }, + { + "epoch": 2.05, + "learning_rate": 2.5068641018544144e-05, + "loss": 0.1228, + "step": 20950 + }, + { + "epoch": 2.05, + "learning_rate": 2.506448934403543e-05, + "loss": 0.1466, + "step": 20955 + }, + { + "epoch": 2.05, + "learning_rate": 2.506033766952671e-05, + "loss": 0.1356, + "step": 20960 + }, + { + "epoch": 2.05, + "learning_rate": 2.5056185995017994e-05, + "loss": 0.1322, + "step": 20965 + }, + { + "epoch": 2.05, + "learning_rate": 2.5052034320509274e-05, + "loss": 0.13, + "step": 20970 + }, + { + "epoch": 2.05, + "learning_rate": 2.5047882646000555e-05, + "loss": 0.1536, + "step": 20975 + }, + { + "epoch": 2.05, + "learning_rate": 2.5043730971491836e-05, + "loss": 0.1169, + "step": 20980 + }, + { + "epoch": 2.05, + "learning_rate": 2.5039579296983117e-05, + "loss": 0.1429, + "step": 20985 + }, + { + "epoch": 2.05, + "learning_rate": 2.5035427622474397e-05, + "loss": 0.1692, + "step": 20990 + }, + { + "epoch": 2.05, + "learning_rate": 2.5031275947965678e-05, + "loss": 0.1407, + "step": 20995 + }, + { + "epoch": 2.05, + "learning_rate": 2.502712427345696e-05, + "loss": 0.129, + "step": 21000 + }, + { + "epoch": 2.05, + "eval_cer": 0.062419214236330296, + "eval_loss": 0.25887730717658997, + "eval_runtime": 271.5991, + "eval_samples_per_second": 60.273, + "eval_steps_per_second": 1.675, + "eval_wer": 0.15952410492154392, + "step": 21000 + }, + { + "epoch": 2.05, + "learning_rate": 2.5022972598948243e-05, + "loss": 0.1357, + "step": 21005 + }, + { + "epoch": 2.05, + "learning_rate": 2.5018820924439527e-05, + "loss": 0.1469, + "step": 21010 + }, + { + "epoch": 2.05, + "learning_rate": 2.5014669249930808e-05, + "loss": 0.1339, + "step": 21015 + }, + { + "epoch": 2.06, + "learning_rate": 2.501051757542209e-05, + "loss": 0.1598, + "step": 21020 + }, + { + "epoch": 2.06, + "learning_rate": 2.500636590091337e-05, + "loss": 0.1679, + "step": 21025 + }, + { + "epoch": 2.06, + "learning_rate": 2.500221422640465e-05, + "loss": 0.1272, + "step": 21030 + }, + { + "epoch": 2.06, + "learning_rate": 2.499806255189593e-05, + "loss": 0.1262, + "step": 21035 + }, + { + "epoch": 2.06, + "learning_rate": 2.4993910877387212e-05, + "loss": 0.1487, + "step": 21040 + }, + { + "epoch": 2.06, + "learning_rate": 2.4989759202878493e-05, + "loss": 0.1276, + "step": 21045 + }, + { + "epoch": 2.06, + "learning_rate": 2.4985607528369773e-05, + "loss": 0.1293, + "step": 21050 + }, + { + "epoch": 2.06, + "learning_rate": 2.498145585386106e-05, + "loss": 0.143, + "step": 21055 + }, + { + "epoch": 2.06, + "learning_rate": 2.4977304179352342e-05, + "loss": 0.1243, + "step": 21060 + }, + { + "epoch": 2.06, + "learning_rate": 2.4973152504843622e-05, + "loss": 0.1071, + "step": 21065 + }, + { + "epoch": 2.06, + "learning_rate": 2.4969000830334903e-05, + "loss": 0.1292, + "step": 21070 + }, + { + "epoch": 2.06, + "learning_rate": 2.4964849155826184e-05, + "loss": 0.1248, + "step": 21075 + }, + { + "epoch": 2.06, + "learning_rate": 2.4960697481317465e-05, + "loss": 0.1272, + "step": 21080 + }, + { + "epoch": 2.06, + "learning_rate": 2.4956545806808746e-05, + "loss": 0.1223, + "step": 21085 + }, + { + "epoch": 2.06, + "learning_rate": 2.4952394132300026e-05, + "loss": 0.1667, + "step": 21090 + }, + { + "epoch": 2.06, + "learning_rate": 2.4948242457791307e-05, + "loss": 0.1267, + "step": 21095 + }, + { + "epoch": 2.06, + "learning_rate": 2.494409078328259e-05, + "loss": 0.1264, + "step": 21100 + }, + { + "epoch": 2.06, + "learning_rate": 2.4939939108773875e-05, + "loss": 0.1438, + "step": 21105 + }, + { + "epoch": 2.06, + "learning_rate": 2.4935787434265156e-05, + "loss": 0.1338, + "step": 21110 + }, + { + "epoch": 2.06, + "learning_rate": 2.4931635759756437e-05, + "loss": 0.1264, + "step": 21115 + }, + { + "epoch": 2.07, + "learning_rate": 2.4927484085247718e-05, + "loss": 0.1313, + "step": 21120 + }, + { + "epoch": 2.07, + "learning_rate": 2.4923332410739e-05, + "loss": 0.1271, + "step": 21125 + }, + { + "epoch": 2.07, + "learning_rate": 2.491918073623028e-05, + "loss": 0.1097, + "step": 21130 + }, + { + "epoch": 2.07, + "learning_rate": 2.491502906172156e-05, + "loss": 0.1207, + "step": 21135 + }, + { + "epoch": 2.07, + "learning_rate": 2.4910877387212844e-05, + "loss": 0.1723, + "step": 21140 + }, + { + "epoch": 2.07, + "learning_rate": 2.4906725712704125e-05, + "loss": 0.12, + "step": 21145 + }, + { + "epoch": 2.07, + "learning_rate": 2.4902574038195406e-05, + "loss": 0.1299, + "step": 21150 + }, + { + "epoch": 2.07, + "learning_rate": 2.4898422363686686e-05, + "loss": 0.1661, + "step": 21155 + }, + { + "epoch": 2.07, + "learning_rate": 2.489427068917797e-05, + "loss": 0.1269, + "step": 21160 + }, + { + "epoch": 2.07, + "learning_rate": 2.489011901466925e-05, + "loss": 0.1372, + "step": 21165 + }, + { + "epoch": 2.07, + "learning_rate": 2.4885967340160532e-05, + "loss": 0.1408, + "step": 21170 + }, + { + "epoch": 2.07, + "learning_rate": 2.4881815665651813e-05, + "loss": 0.1381, + "step": 21175 + }, + { + "epoch": 2.07, + "learning_rate": 2.4877663991143094e-05, + "loss": 0.125, + "step": 21180 + }, + { + "epoch": 2.07, + "learning_rate": 2.4873512316634378e-05, + "loss": 0.1345, + "step": 21185 + }, + { + "epoch": 2.07, + "learning_rate": 2.486936064212566e-05, + "loss": 0.1548, + "step": 21190 + }, + { + "epoch": 2.07, + "learning_rate": 2.486520896761694e-05, + "loss": 0.1184, + "step": 21195 + }, + { + "epoch": 2.07, + "learning_rate": 2.486105729310822e-05, + "loss": 0.1343, + "step": 21200 + }, + { + "epoch": 2.07, + "learning_rate": 2.48569056185995e-05, + "loss": 0.1746, + "step": 21205 + }, + { + "epoch": 2.07, + "learning_rate": 2.4852753944090785e-05, + "loss": 0.1428, + "step": 21210 + }, + { + "epoch": 2.07, + "learning_rate": 2.4848602269582066e-05, + "loss": 0.1274, + "step": 21215 + }, + { + "epoch": 2.07, + "learning_rate": 2.4844450595073347e-05, + "loss": 0.1362, + "step": 21220 + }, + { + "epoch": 2.08, + "learning_rate": 2.4840298920564627e-05, + "loss": 0.1439, + "step": 21225 + }, + { + "epoch": 2.08, + "learning_rate": 2.483614724605591e-05, + "loss": 0.1376, + "step": 21230 + }, + { + "epoch": 2.08, + "learning_rate": 2.4831995571547192e-05, + "loss": 0.1307, + "step": 21235 + }, + { + "epoch": 2.08, + "learning_rate": 2.4827843897038473e-05, + "loss": 0.1404, + "step": 21240 + }, + { + "epoch": 2.08, + "learning_rate": 2.4823692222529754e-05, + "loss": 0.1403, + "step": 21245 + }, + { + "epoch": 2.08, + "learning_rate": 2.4819540548021035e-05, + "loss": 0.1287, + "step": 21250 + }, + { + "epoch": 2.08, + "learning_rate": 2.4815388873512315e-05, + "loss": 0.1397, + "step": 21255 + }, + { + "epoch": 2.08, + "learning_rate": 2.48112371990036e-05, + "loss": 0.157, + "step": 21260 + }, + { + "epoch": 2.08, + "learning_rate": 2.480708552449488e-05, + "loss": 0.1162, + "step": 21265 + }, + { + "epoch": 2.08, + "learning_rate": 2.480293384998616e-05, + "loss": 0.1342, + "step": 21270 + }, + { + "epoch": 2.08, + "learning_rate": 2.4798782175477445e-05, + "loss": 0.1432, + "step": 21275 + }, + { + "epoch": 2.08, + "learning_rate": 2.4794630500968726e-05, + "loss": 0.1328, + "step": 21280 + }, + { + "epoch": 2.08, + "learning_rate": 2.4790478826460007e-05, + "loss": 0.1196, + "step": 21285 + }, + { + "epoch": 2.08, + "learning_rate": 2.4786327151951288e-05, + "loss": 0.1546, + "step": 21290 + }, + { + "epoch": 2.08, + "learning_rate": 2.478217547744257e-05, + "loss": 0.1323, + "step": 21295 + }, + { + "epoch": 2.08, + "learning_rate": 2.477802380293385e-05, + "loss": 0.1247, + "step": 21300 + }, + { + "epoch": 2.08, + "learning_rate": 2.477387212842513e-05, + "loss": 0.1302, + "step": 21305 + }, + { + "epoch": 2.08, + "learning_rate": 2.4769720453916414e-05, + "loss": 0.1241, + "step": 21310 + }, + { + "epoch": 2.08, + "learning_rate": 2.4765568779407695e-05, + "loss": 0.136, + "step": 21315 + }, + { + "epoch": 2.08, + "learning_rate": 2.476141710489898e-05, + "loss": 0.1439, + "step": 21320 + }, + { + "epoch": 2.09, + "learning_rate": 2.475726543039026e-05, + "loss": 0.1391, + "step": 21325 + }, + { + "epoch": 2.09, + "learning_rate": 2.475311375588154e-05, + "loss": 0.1235, + "step": 21330 + }, + { + "epoch": 2.09, + "learning_rate": 2.474896208137282e-05, + "loss": 0.1287, + "step": 21335 + }, + { + "epoch": 2.09, + "learning_rate": 2.4744810406864102e-05, + "loss": 0.1416, + "step": 21340 + }, + { + "epoch": 2.09, + "learning_rate": 2.4740658732355383e-05, + "loss": 0.1315, + "step": 21345 + }, + { + "epoch": 2.09, + "learning_rate": 2.4736507057846664e-05, + "loss": 0.1363, + "step": 21350 + }, + { + "epoch": 2.09, + "learning_rate": 2.4732355383337944e-05, + "loss": 0.1403, + "step": 21355 + }, + { + "epoch": 2.09, + "learning_rate": 2.4728203708829225e-05, + "loss": 0.1203, + "step": 21360 + }, + { + "epoch": 2.09, + "learning_rate": 2.4724052034320513e-05, + "loss": 0.1298, + "step": 21365 + }, + { + "epoch": 2.09, + "learning_rate": 2.4719900359811793e-05, + "loss": 0.1233, + "step": 21370 + }, + { + "epoch": 2.09, + "learning_rate": 2.4715748685303074e-05, + "loss": 0.1518, + "step": 21375 + }, + { + "epoch": 2.09, + "learning_rate": 2.4711597010794355e-05, + "loss": 0.132, + "step": 21380 + }, + { + "epoch": 2.09, + "learning_rate": 2.4707445336285636e-05, + "loss": 0.1143, + "step": 21385 + }, + { + "epoch": 2.09, + "learning_rate": 2.4703293661776916e-05, + "loss": 0.1419, + "step": 21390 + }, + { + "epoch": 2.09, + "learning_rate": 2.4699141987268197e-05, + "loss": 0.1386, + "step": 21395 + }, + { + "epoch": 2.09, + "learning_rate": 2.4694990312759478e-05, + "loss": 0.1258, + "step": 21400 + }, + { + "epoch": 2.09, + "learning_rate": 2.4690838638250762e-05, + "loss": 0.1352, + "step": 21405 + }, + { + "epoch": 2.09, + "learning_rate": 2.4686686963742043e-05, + "loss": 0.124, + "step": 21410 + }, + { + "epoch": 2.09, + "learning_rate": 2.4682535289233327e-05, + "loss": 0.1292, + "step": 21415 + }, + { + "epoch": 2.09, + "learning_rate": 2.4678383614724608e-05, + "loss": 0.1515, + "step": 21420 + }, + { + "epoch": 2.1, + "learning_rate": 2.467423194021589e-05, + "loss": 0.1495, + "step": 21425 + }, + { + "epoch": 2.1, + "learning_rate": 2.467008026570717e-05, + "loss": 0.1237, + "step": 21430 + }, + { + "epoch": 2.1, + "learning_rate": 2.466592859119845e-05, + "loss": 0.1158, + "step": 21435 + }, + { + "epoch": 2.1, + "learning_rate": 2.466177691668973e-05, + "loss": 0.1493, + "step": 21440 + }, + { + "epoch": 2.1, + "learning_rate": 2.4657625242181012e-05, + "loss": 0.1077, + "step": 21445 + }, + { + "epoch": 2.1, + "learning_rate": 2.4653473567672296e-05, + "loss": 0.113, + "step": 21450 + }, + { + "epoch": 2.1, + "learning_rate": 2.4649321893163577e-05, + "loss": 0.1495, + "step": 21455 + }, + { + "epoch": 2.1, + "learning_rate": 2.4645170218654857e-05, + "loss": 0.1314, + "step": 21460 + }, + { + "epoch": 2.1, + "learning_rate": 2.464101854414614e-05, + "loss": 0.1165, + "step": 21465 + }, + { + "epoch": 2.1, + "learning_rate": 2.4636866869637422e-05, + "loss": 0.1186, + "step": 21470 + }, + { + "epoch": 2.1, + "learning_rate": 2.4632715195128703e-05, + "loss": 0.139, + "step": 21475 + }, + { + "epoch": 2.1, + "learning_rate": 2.4628563520619984e-05, + "loss": 0.1255, + "step": 21480 + }, + { + "epoch": 2.1, + "learning_rate": 2.4624411846111265e-05, + "loss": 0.1226, + "step": 21485 + }, + { + "epoch": 2.1, + "learning_rate": 2.4620260171602545e-05, + "loss": 0.1603, + "step": 21490 + }, + { + "epoch": 2.1, + "learning_rate": 2.461610849709383e-05, + "loss": 0.1172, + "step": 21495 + }, + { + "epoch": 2.1, + "learning_rate": 2.461195682258511e-05, + "loss": 0.1198, + "step": 21500 + }, + { + "epoch": 2.1, + "eval_cer": 0.0631233076899954, + "eval_loss": 0.26294419169425964, + "eval_runtime": 278.9164, + "eval_samples_per_second": 58.691, + "eval_steps_per_second": 1.631, + "eval_wer": 0.1628608555402467, + "step": 21500 + }, + { + "epoch": 2.1, + "learning_rate": 2.460780514807639e-05, + "loss": 0.1637, + "step": 21505 + }, + { + "epoch": 2.1, + "learning_rate": 2.4603653473567672e-05, + "loss": 0.1365, + "step": 21510 + }, + { + "epoch": 2.1, + "learning_rate": 2.4599501799058956e-05, + "loss": 0.1226, + "step": 21515 + }, + { + "epoch": 2.1, + "learning_rate": 2.4595350124550237e-05, + "loss": 0.1571, + "step": 21520 + }, + { + "epoch": 2.1, + "learning_rate": 2.4591198450041518e-05, + "loss": 0.1347, + "step": 21525 + }, + { + "epoch": 2.11, + "learning_rate": 2.45870467755328e-05, + "loss": 0.1075, + "step": 21530 + }, + { + "epoch": 2.11, + "learning_rate": 2.458289510102408e-05, + "loss": 0.1337, + "step": 21535 + }, + { + "epoch": 2.11, + "learning_rate": 2.4578743426515363e-05, + "loss": 0.1491, + "step": 21540 + }, + { + "epoch": 2.11, + "learning_rate": 2.4574591752006644e-05, + "loss": 0.1262, + "step": 21545 + }, + { + "epoch": 2.11, + "learning_rate": 2.4570440077497925e-05, + "loss": 0.1235, + "step": 21550 + }, + { + "epoch": 2.11, + "learning_rate": 2.4566288402989206e-05, + "loss": 0.1504, + "step": 21555 + }, + { + "epoch": 2.11, + "learning_rate": 2.4562136728480486e-05, + "loss": 0.1302, + "step": 21560 + }, + { + "epoch": 2.11, + "learning_rate": 2.4557985053971767e-05, + "loss": 0.1305, + "step": 21565 + }, + { + "epoch": 2.11, + "learning_rate": 2.455383337946305e-05, + "loss": 0.1327, + "step": 21570 + }, + { + "epoch": 2.11, + "learning_rate": 2.4549681704954332e-05, + "loss": 0.1642, + "step": 21575 + }, + { + "epoch": 2.11, + "learning_rate": 2.4545530030445613e-05, + "loss": 0.1203, + "step": 21580 + }, + { + "epoch": 2.11, + "learning_rate": 2.4541378355936897e-05, + "loss": 0.125, + "step": 21585 + }, + { + "epoch": 2.11, + "learning_rate": 2.4537226681428178e-05, + "loss": 0.1603, + "step": 21590 + }, + { + "epoch": 2.11, + "learning_rate": 2.453307500691946e-05, + "loss": 0.12, + "step": 21595 + }, + { + "epoch": 2.11, + "learning_rate": 2.452892333241074e-05, + "loss": 0.1101, + "step": 21600 + }, + { + "epoch": 2.11, + "learning_rate": 2.452477165790202e-05, + "loss": 0.1338, + "step": 21605 + }, + { + "epoch": 2.11, + "learning_rate": 2.45206199833933e-05, + "loss": 0.1303, + "step": 21610 + }, + { + "epoch": 2.11, + "learning_rate": 2.451646830888458e-05, + "loss": 0.1164, + "step": 21615 + }, + { + "epoch": 2.11, + "learning_rate": 2.4512316634375866e-05, + "loss": 0.1444, + "step": 21620 + }, + { + "epoch": 2.11, + "learning_rate": 2.450816495986715e-05, + "loss": 0.1309, + "step": 21625 + }, + { + "epoch": 2.12, + "learning_rate": 2.450401328535843e-05, + "loss": 0.1392, + "step": 21630 + }, + { + "epoch": 2.12, + "learning_rate": 2.449986161084971e-05, + "loss": 0.1105, + "step": 21635 + }, + { + "epoch": 2.12, + "learning_rate": 2.4495709936340992e-05, + "loss": 0.1432, + "step": 21640 + }, + { + "epoch": 2.12, + "learning_rate": 2.4491558261832273e-05, + "loss": 0.1212, + "step": 21645 + }, + { + "epoch": 2.12, + "learning_rate": 2.4487406587323554e-05, + "loss": 0.1117, + "step": 21650 + }, + { + "epoch": 2.12, + "learning_rate": 2.4483254912814834e-05, + "loss": 0.1643, + "step": 21655 + }, + { + "epoch": 2.12, + "learning_rate": 2.4479103238306115e-05, + "loss": 0.1206, + "step": 21660 + }, + { + "epoch": 2.12, + "learning_rate": 2.4474951563797396e-05, + "loss": 0.1163, + "step": 21665 + }, + { + "epoch": 2.12, + "learning_rate": 2.4470799889288684e-05, + "loss": 0.139, + "step": 21670 + }, + { + "epoch": 2.12, + "learning_rate": 2.4466648214779964e-05, + "loss": 0.1379, + "step": 21675 + }, + { + "epoch": 2.12, + "learning_rate": 2.4462496540271245e-05, + "loss": 0.1031, + "step": 21680 + }, + { + "epoch": 2.12, + "learning_rate": 2.4458344865762526e-05, + "loss": 0.1455, + "step": 21685 + }, + { + "epoch": 2.12, + "learning_rate": 2.4454193191253807e-05, + "loss": 0.1555, + "step": 21690 + }, + { + "epoch": 2.12, + "learning_rate": 2.4450041516745087e-05, + "loss": 0.1324, + "step": 21695 + }, + { + "epoch": 2.12, + "learning_rate": 2.4445889842236368e-05, + "loss": 0.1074, + "step": 21700 + }, + { + "epoch": 2.12, + "learning_rate": 2.444173816772765e-05, + "loss": 0.1173, + "step": 21705 + }, + { + "epoch": 2.12, + "learning_rate": 2.443758649321893e-05, + "loss": 0.133, + "step": 21710 + }, + { + "epoch": 2.12, + "learning_rate": 2.4433434818710214e-05, + "loss": 0.1224, + "step": 21715 + }, + { + "epoch": 2.12, + "learning_rate": 2.4429283144201498e-05, + "loss": 0.1433, + "step": 21720 + }, + { + "epoch": 2.12, + "learning_rate": 2.442513146969278e-05, + "loss": 0.1366, + "step": 21725 + }, + { + "epoch": 2.12, + "learning_rate": 2.442097979518406e-05, + "loss": 0.1213, + "step": 21730 + }, + { + "epoch": 2.13, + "learning_rate": 2.441682812067534e-05, + "loss": 0.1274, + "step": 21735 + }, + { + "epoch": 2.13, + "learning_rate": 2.441267644616662e-05, + "loss": 0.1423, + "step": 21740 + }, + { + "epoch": 2.13, + "learning_rate": 2.4408524771657902e-05, + "loss": 0.1175, + "step": 21745 + }, + { + "epoch": 2.13, + "learning_rate": 2.4404373097149183e-05, + "loss": 0.1066, + "step": 21750 + }, + { + "epoch": 2.13, + "learning_rate": 2.4400221422640463e-05, + "loss": 0.1394, + "step": 21755 + }, + { + "epoch": 2.13, + "learning_rate": 2.4396069748131748e-05, + "loss": 0.1284, + "step": 21760 + }, + { + "epoch": 2.13, + "learning_rate": 2.439191807362303e-05, + "loss": 0.1197, + "step": 21765 + }, + { + "epoch": 2.13, + "learning_rate": 2.438776639911431e-05, + "loss": 0.1194, + "step": 21770 + }, + { + "epoch": 2.13, + "learning_rate": 2.4383614724605593e-05, + "loss": 0.1398, + "step": 21775 + }, + { + "epoch": 2.13, + "learning_rate": 2.4379463050096874e-05, + "loss": 0.1194, + "step": 21780 + }, + { + "epoch": 2.13, + "learning_rate": 2.4375311375588155e-05, + "loss": 0.1313, + "step": 21785 + }, + { + "epoch": 2.13, + "learning_rate": 2.4371159701079436e-05, + "loss": 0.1763, + "step": 21790 + }, + { + "epoch": 2.13, + "learning_rate": 2.4367008026570716e-05, + "loss": 0.1164, + "step": 21795 + }, + { + "epoch": 2.13, + "learning_rate": 2.4362856352061997e-05, + "loss": 0.0998, + "step": 21800 + }, + { + "epoch": 2.13, + "learning_rate": 2.435870467755328e-05, + "loss": 0.1656, + "step": 21805 + }, + { + "epoch": 2.13, + "learning_rate": 2.4354553003044562e-05, + "loss": 0.1292, + "step": 21810 + }, + { + "epoch": 2.13, + "learning_rate": 2.4350401328535843e-05, + "loss": 0.118, + "step": 21815 + }, + { + "epoch": 2.13, + "learning_rate": 2.4346249654027124e-05, + "loss": 0.1095, + "step": 21820 + }, + { + "epoch": 2.13, + "learning_rate": 2.4342097979518408e-05, + "loss": 0.1387, + "step": 21825 + }, + { + "epoch": 2.13, + "learning_rate": 2.433794630500969e-05, + "loss": 0.1318, + "step": 21830 + }, + { + "epoch": 2.14, + "learning_rate": 2.433379463050097e-05, + "loss": 0.1262, + "step": 21835 + }, + { + "epoch": 2.14, + "learning_rate": 2.432964295599225e-05, + "loss": 0.1471, + "step": 21840 + }, + { + "epoch": 2.14, + "learning_rate": 2.4325491281483534e-05, + "loss": 0.1224, + "step": 21845 + }, + { + "epoch": 2.14, + "learning_rate": 2.4321339606974815e-05, + "loss": 0.1102, + "step": 21850 + }, + { + "epoch": 2.14, + "learning_rate": 2.4317187932466096e-05, + "loss": 0.1419, + "step": 21855 + }, + { + "epoch": 2.14, + "learning_rate": 2.4313036257957376e-05, + "loss": 0.125, + "step": 21860 + }, + { + "epoch": 2.14, + "learning_rate": 2.4308884583448657e-05, + "loss": 0.1266, + "step": 21865 + }, + { + "epoch": 2.14, + "learning_rate": 2.4304732908939938e-05, + "loss": 0.1404, + "step": 21870 + }, + { + "epoch": 2.14, + "learning_rate": 2.4300581234431222e-05, + "loss": 0.1386, + "step": 21875 + }, + { + "epoch": 2.14, + "learning_rate": 2.4296429559922503e-05, + "loss": 0.1289, + "step": 21880 + }, + { + "epoch": 2.14, + "learning_rate": 2.4292277885413784e-05, + "loss": 0.1328, + "step": 21885 + }, + { + "epoch": 2.14, + "learning_rate": 2.4288126210905068e-05, + "loss": 0.1501, + "step": 21890 + }, + { + "epoch": 2.14, + "learning_rate": 2.428397453639635e-05, + "loss": 0.1451, + "step": 21895 + }, + { + "epoch": 2.14, + "learning_rate": 2.427982286188763e-05, + "loss": 0.1065, + "step": 21900 + }, + { + "epoch": 2.14, + "learning_rate": 2.427567118737891e-05, + "loss": 0.1398, + "step": 21905 + }, + { + "epoch": 2.14, + "learning_rate": 2.427151951287019e-05, + "loss": 0.1129, + "step": 21910 + }, + { + "epoch": 2.14, + "learning_rate": 2.426736783836147e-05, + "loss": 0.1284, + "step": 21915 + }, + { + "epoch": 2.14, + "learning_rate": 2.4263216163852752e-05, + "loss": 0.1167, + "step": 21920 + }, + { + "epoch": 2.14, + "learning_rate": 2.4259064489344037e-05, + "loss": 0.1455, + "step": 21925 + }, + { + "epoch": 2.14, + "learning_rate": 2.4254912814835317e-05, + "loss": 0.1106, + "step": 21930 + }, + { + "epoch": 2.14, + "learning_rate": 2.42507611403266e-05, + "loss": 0.133, + "step": 21935 + }, + { + "epoch": 2.15, + "learning_rate": 2.4246609465817882e-05, + "loss": 0.1531, + "step": 21940 + }, + { + "epoch": 2.15, + "learning_rate": 2.4242457791309163e-05, + "loss": 0.1274, + "step": 21945 + }, + { + "epoch": 2.15, + "learning_rate": 2.4238306116800444e-05, + "loss": 0.1024, + "step": 21950 + }, + { + "epoch": 2.15, + "learning_rate": 2.4234154442291725e-05, + "loss": 0.1464, + "step": 21955 + }, + { + "epoch": 2.15, + "learning_rate": 2.4230002767783005e-05, + "loss": 0.1306, + "step": 21960 + }, + { + "epoch": 2.15, + "learning_rate": 2.4225851093274286e-05, + "loss": 0.1222, + "step": 21965 + }, + { + "epoch": 2.15, + "learning_rate": 2.4221699418765567e-05, + "loss": 0.1537, + "step": 21970 + }, + { + "epoch": 2.15, + "learning_rate": 2.4217547744256848e-05, + "loss": 0.1392, + "step": 21975 + }, + { + "epoch": 2.15, + "learning_rate": 2.4213396069748135e-05, + "loss": 0.1179, + "step": 21980 + }, + { + "epoch": 2.15, + "learning_rate": 2.4209244395239416e-05, + "loss": 0.1173, + "step": 21985 + }, + { + "epoch": 2.15, + "learning_rate": 2.4205092720730697e-05, + "loss": 0.1504, + "step": 21990 + }, + { + "epoch": 2.15, + "learning_rate": 2.4200941046221978e-05, + "loss": 0.1164, + "step": 21995 + }, + { + "epoch": 2.15, + "learning_rate": 2.4196789371713258e-05, + "loss": 0.1083, + "step": 22000 + }, + { + "epoch": 2.15, + "eval_cer": 0.0626990017827785, + "eval_loss": 0.2608412206172943, + "eval_runtime": 273.5215, + "eval_samples_per_second": 59.849, + "eval_steps_per_second": 1.663, + "eval_wer": 0.16037951457134836, + "step": 22000 + }, + { + "epoch": 2.15, + "learning_rate": 2.419263769720454e-05, + "loss": 0.129, + "step": 22005 + }, + { + "epoch": 2.15, + "learning_rate": 2.418848602269582e-05, + "loss": 0.1257, + "step": 22010 + }, + { + "epoch": 2.15, + "learning_rate": 2.41843343481871e-05, + "loss": 0.1187, + "step": 22015 + }, + { + "epoch": 2.15, + "learning_rate": 2.418018267367838e-05, + "loss": 0.1552, + "step": 22020 + }, + { + "epoch": 2.15, + "learning_rate": 2.4176030999169666e-05, + "loss": 0.1564, + "step": 22025 + }, + { + "epoch": 2.15, + "learning_rate": 2.417187932466095e-05, + "loss": 0.1292, + "step": 22030 + }, + { + "epoch": 2.15, + "learning_rate": 2.416772765015223e-05, + "loss": 0.1238, + "step": 22035 + }, + { + "epoch": 2.16, + "learning_rate": 2.416357597564351e-05, + "loss": 0.1352, + "step": 22040 + }, + { + "epoch": 2.16, + "learning_rate": 2.4159424301134792e-05, + "loss": 0.1191, + "step": 22045 + }, + { + "epoch": 2.16, + "learning_rate": 2.4155272626626073e-05, + "loss": 0.1268, + "step": 22050 + }, + { + "epoch": 2.16, + "learning_rate": 2.4151120952117354e-05, + "loss": 0.156, + "step": 22055 + }, + { + "epoch": 2.16, + "learning_rate": 2.4146969277608634e-05, + "loss": 0.1438, + "step": 22060 + }, + { + "epoch": 2.16, + "learning_rate": 2.4142817603099915e-05, + "loss": 0.1236, + "step": 22065 + }, + { + "epoch": 2.16, + "learning_rate": 2.41386659285912e-05, + "loss": 0.144, + "step": 22070 + }, + { + "epoch": 2.16, + "learning_rate": 2.413451425408248e-05, + "loss": 0.1361, + "step": 22075 + }, + { + "epoch": 2.16, + "learning_rate": 2.4130362579573764e-05, + "loss": 0.1145, + "step": 22080 + }, + { + "epoch": 2.16, + "learning_rate": 2.4126210905065045e-05, + "loss": 0.1285, + "step": 22085 + }, + { + "epoch": 2.16, + "learning_rate": 2.4122059230556326e-05, + "loss": 0.1475, + "step": 22090 + }, + { + "epoch": 2.16, + "learning_rate": 2.4117907556047606e-05, + "loss": 0.1239, + "step": 22095 + }, + { + "epoch": 2.16, + "learning_rate": 2.4113755881538887e-05, + "loss": 0.1159, + "step": 22100 + }, + { + "epoch": 2.16, + "learning_rate": 2.4109604207030168e-05, + "loss": 0.1339, + "step": 22105 + }, + { + "epoch": 2.16, + "learning_rate": 2.4105452532521452e-05, + "loss": 0.134, + "step": 22110 + }, + { + "epoch": 2.16, + "learning_rate": 2.4101300858012733e-05, + "loss": 0.1177, + "step": 22115 + }, + { + "epoch": 2.16, + "learning_rate": 2.4097149183504014e-05, + "loss": 0.1441, + "step": 22120 + }, + { + "epoch": 2.16, + "learning_rate": 2.4092997508995294e-05, + "loss": 0.1408, + "step": 22125 + }, + { + "epoch": 2.16, + "learning_rate": 2.408884583448658e-05, + "loss": 0.1163, + "step": 22130 + }, + { + "epoch": 2.16, + "learning_rate": 2.408469415997786e-05, + "loss": 0.1158, + "step": 22135 + }, + { + "epoch": 2.16, + "learning_rate": 2.408054248546914e-05, + "loss": 0.1464, + "step": 22140 + }, + { + "epoch": 2.17, + "learning_rate": 2.407639081096042e-05, + "loss": 0.1276, + "step": 22145 + }, + { + "epoch": 2.17, + "learning_rate": 2.40722391364517e-05, + "loss": 0.1082, + "step": 22150 + }, + { + "epoch": 2.17, + "learning_rate": 2.4068087461942986e-05, + "loss": 0.1413, + "step": 22155 + }, + { + "epoch": 2.17, + "learning_rate": 2.4063935787434267e-05, + "loss": 0.1153, + "step": 22160 + }, + { + "epoch": 2.17, + "learning_rate": 2.4059784112925547e-05, + "loss": 0.1157, + "step": 22165 + }, + { + "epoch": 2.17, + "learning_rate": 2.4055632438416828e-05, + "loss": 0.1368, + "step": 22170 + }, + { + "epoch": 2.17, + "learning_rate": 2.405148076390811e-05, + "loss": 0.1396, + "step": 22175 + }, + { + "epoch": 2.17, + "learning_rate": 2.404732908939939e-05, + "loss": 0.1338, + "step": 22180 + }, + { + "epoch": 2.17, + "learning_rate": 2.4043177414890674e-05, + "loss": 0.1376, + "step": 22185 + }, + { + "epoch": 2.17, + "learning_rate": 2.4039025740381955e-05, + "loss": 0.1447, + "step": 22190 + }, + { + "epoch": 2.17, + "learning_rate": 2.4034874065873235e-05, + "loss": 0.1322, + "step": 22195 + }, + { + "epoch": 2.17, + "learning_rate": 2.403072239136452e-05, + "loss": 0.1206, + "step": 22200 + }, + { + "epoch": 2.17, + "learning_rate": 2.40265707168558e-05, + "loss": 0.1376, + "step": 22205 + }, + { + "epoch": 2.17, + "learning_rate": 2.402241904234708e-05, + "loss": 0.1411, + "step": 22210 + }, + { + "epoch": 2.17, + "learning_rate": 2.4018267367838362e-05, + "loss": 0.1347, + "step": 22215 + }, + { + "epoch": 2.17, + "learning_rate": 2.4014115693329643e-05, + "loss": 0.131, + "step": 22220 + }, + { + "epoch": 2.17, + "learning_rate": 2.4009964018820923e-05, + "loss": 0.1324, + "step": 22225 + }, + { + "epoch": 2.17, + "learning_rate": 2.4005812344312204e-05, + "loss": 0.1336, + "step": 22230 + }, + { + "epoch": 2.17, + "learning_rate": 2.4001660669803488e-05, + "loss": 0.1454, + "step": 22235 + }, + { + "epoch": 2.17, + "learning_rate": 2.399750899529477e-05, + "loss": 0.1646, + "step": 22240 + }, + { + "epoch": 2.18, + "learning_rate": 2.3993357320786053e-05, + "loss": 0.1206, + "step": 22245 + }, + { + "epoch": 2.18, + "learning_rate": 2.3989205646277334e-05, + "loss": 0.1152, + "step": 22250 + }, + { + "epoch": 2.18, + "learning_rate": 2.3985053971768615e-05, + "loss": 0.1443, + "step": 22255 + }, + { + "epoch": 2.18, + "learning_rate": 2.3980902297259896e-05, + "loss": 0.1353, + "step": 22260 + }, + { + "epoch": 2.18, + "learning_rate": 2.3976750622751176e-05, + "loss": 0.1243, + "step": 22265 + }, + { + "epoch": 2.18, + "learning_rate": 2.3972598948242457e-05, + "loss": 0.1567, + "step": 22270 + }, + { + "epoch": 2.18, + "learning_rate": 2.3968447273733738e-05, + "loss": 0.1461, + "step": 22275 + }, + { + "epoch": 2.18, + "learning_rate": 2.396429559922502e-05, + "loss": 0.1318, + "step": 22280 + }, + { + "epoch": 2.18, + "learning_rate": 2.3960143924716303e-05, + "loss": 0.1132, + "step": 22285 + }, + { + "epoch": 2.18, + "learning_rate": 2.3955992250207587e-05, + "loss": 0.1472, + "step": 22290 + }, + { + "epoch": 2.18, + "learning_rate": 2.3951840575698868e-05, + "loss": 0.1258, + "step": 22295 + }, + { + "epoch": 2.18, + "learning_rate": 2.394768890119015e-05, + "loss": 0.1141, + "step": 22300 + }, + { + "epoch": 2.18, + "learning_rate": 2.394353722668143e-05, + "loss": 0.1467, + "step": 22305 + }, + { + "epoch": 2.18, + "learning_rate": 2.393938555217271e-05, + "loss": 0.1374, + "step": 22310 + }, + { + "epoch": 2.18, + "learning_rate": 2.393523387766399e-05, + "loss": 0.1163, + "step": 22315 + }, + { + "epoch": 2.18, + "learning_rate": 2.393108220315527e-05, + "loss": 0.1217, + "step": 22320 + }, + { + "epoch": 2.18, + "learning_rate": 2.3926930528646552e-05, + "loss": 0.131, + "step": 22325 + }, + { + "epoch": 2.18, + "learning_rate": 2.3922778854137836e-05, + "loss": 0.107, + "step": 22330 + }, + { + "epoch": 2.18, + "learning_rate": 2.391862717962912e-05, + "loss": 0.1251, + "step": 22335 + }, + { + "epoch": 2.18, + "learning_rate": 2.39144755051204e-05, + "loss": 0.1428, + "step": 22340 + }, + { + "epoch": 2.18, + "learning_rate": 2.3910323830611682e-05, + "loss": 0.1146, + "step": 22345 + }, + { + "epoch": 2.19, + "learning_rate": 2.3906172156102963e-05, + "loss": 0.0951, + "step": 22350 + }, + { + "epoch": 2.19, + "learning_rate": 2.3902020481594244e-05, + "loss": 0.138, + "step": 22355 + }, + { + "epoch": 2.19, + "learning_rate": 2.3897868807085524e-05, + "loss": 0.1192, + "step": 22360 + }, + { + "epoch": 2.19, + "learning_rate": 2.3893717132576805e-05, + "loss": 0.1097, + "step": 22365 + }, + { + "epoch": 2.19, + "learning_rate": 2.3889565458068086e-05, + "loss": 0.1183, + "step": 22370 + }, + { + "epoch": 2.19, + "learning_rate": 2.388541378355937e-05, + "loss": 0.135, + "step": 22375 + }, + { + "epoch": 2.19, + "learning_rate": 2.388126210905065e-05, + "loss": 0.1167, + "step": 22380 + }, + { + "epoch": 2.19, + "learning_rate": 2.387711043454193e-05, + "loss": 0.1347, + "step": 22385 + }, + { + "epoch": 2.19, + "learning_rate": 2.3872958760033216e-05, + "loss": 0.1513, + "step": 22390 + }, + { + "epoch": 2.19, + "learning_rate": 2.3868807085524497e-05, + "loss": 0.1247, + "step": 22395 + }, + { + "epoch": 2.19, + "learning_rate": 2.3864655411015777e-05, + "loss": 0.1126, + "step": 22400 + }, + { + "epoch": 2.19, + "learning_rate": 2.3860503736507058e-05, + "loss": 0.1599, + "step": 22405 + }, + { + "epoch": 2.19, + "learning_rate": 2.385635206199834e-05, + "loss": 0.1158, + "step": 22410 + }, + { + "epoch": 2.19, + "learning_rate": 2.385220038748962e-05, + "loss": 0.1355, + "step": 22415 + }, + { + "epoch": 2.19, + "learning_rate": 2.3848048712980904e-05, + "loss": 0.1548, + "step": 22420 + }, + { + "epoch": 2.19, + "learning_rate": 2.3843897038472185e-05, + "loss": 0.1407, + "step": 22425 + }, + { + "epoch": 2.19, + "learning_rate": 2.3839745363963465e-05, + "loss": 0.1168, + "step": 22430 + }, + { + "epoch": 2.19, + "learning_rate": 2.3835593689454746e-05, + "loss": 0.1285, + "step": 22435 + }, + { + "epoch": 2.19, + "learning_rate": 2.383144201494603e-05, + "loss": 0.144, + "step": 22440 + }, + { + "epoch": 2.19, + "learning_rate": 2.382729034043731e-05, + "loss": 0.1256, + "step": 22445 + }, + { + "epoch": 2.2, + "learning_rate": 2.3823138665928592e-05, + "loss": 0.129, + "step": 22450 + }, + { + "epoch": 2.2, + "learning_rate": 2.3818986991419873e-05, + "loss": 0.1615, + "step": 22455 + }, + { + "epoch": 2.2, + "learning_rate": 2.3814835316911153e-05, + "loss": 0.1257, + "step": 22460 + }, + { + "epoch": 2.2, + "learning_rate": 2.3810683642402438e-05, + "loss": 0.1215, + "step": 22465 + }, + { + "epoch": 2.2, + "learning_rate": 2.3806531967893718e-05, + "loss": 0.1201, + "step": 22470 + }, + { + "epoch": 2.2, + "learning_rate": 2.3802380293385e-05, + "loss": 0.1291, + "step": 22475 + }, + { + "epoch": 2.2, + "learning_rate": 2.379822861887628e-05, + "loss": 0.1067, + "step": 22480 + }, + { + "epoch": 2.2, + "learning_rate": 2.379407694436756e-05, + "loss": 0.1275, + "step": 22485 + }, + { + "epoch": 2.2, + "learning_rate": 2.3789925269858845e-05, + "loss": 0.1423, + "step": 22490 + }, + { + "epoch": 2.2, + "learning_rate": 2.3785773595350126e-05, + "loss": 0.1233, + "step": 22495 + }, + { + "epoch": 2.2, + "learning_rate": 2.3781621920841406e-05, + "loss": 0.1446, + "step": 22500 + }, + { + "epoch": 2.2, + "eval_cer": 0.06288976601899318, + "eval_loss": 0.2597942054271698, + "eval_runtime": 278.6319, + "eval_samples_per_second": 58.751, + "eval_steps_per_second": 1.633, + "eval_wer": 0.1613524614249427, + "step": 22500 + }, + { + "epoch": 2.2, + "learning_rate": 2.3777470246332687e-05, + "loss": 0.1572, + "step": 22505 + }, + { + "epoch": 2.2, + "learning_rate": 2.377331857182397e-05, + "loss": 0.1346, + "step": 22510 + }, + { + "epoch": 2.2, + "learning_rate": 2.3769166897315252e-05, + "loss": 0.1063, + "step": 22515 + }, + { + "epoch": 2.2, + "learning_rate": 2.3765015222806533e-05, + "loss": 0.1377, + "step": 22520 + }, + { + "epoch": 2.2, + "learning_rate": 2.3760863548297814e-05, + "loss": 0.1372, + "step": 22525 + }, + { + "epoch": 2.2, + "learning_rate": 2.3756711873789094e-05, + "loss": 0.1164, + "step": 22530 + }, + { + "epoch": 2.2, + "learning_rate": 2.3752560199280375e-05, + "loss": 0.1446, + "step": 22535 + }, + { + "epoch": 2.2, + "learning_rate": 2.374840852477166e-05, + "loss": 0.138, + "step": 22540 + }, + { + "epoch": 2.2, + "learning_rate": 2.374425685026294e-05, + "loss": 0.1315, + "step": 22545 + }, + { + "epoch": 2.21, + "learning_rate": 2.3740105175754224e-05, + "loss": 0.1294, + "step": 22550 + }, + { + "epoch": 2.21, + "learning_rate": 2.3735953501245505e-05, + "loss": 0.1457, + "step": 22555 + }, + { + "epoch": 2.21, + "learning_rate": 2.3731801826736786e-05, + "loss": 0.1331, + "step": 22560 + }, + { + "epoch": 2.21, + "learning_rate": 2.3727650152228066e-05, + "loss": 0.1117, + "step": 22565 + }, + { + "epoch": 2.21, + "learning_rate": 2.3723498477719347e-05, + "loss": 0.1141, + "step": 22570 + }, + { + "epoch": 2.21, + "learning_rate": 2.3719346803210628e-05, + "loss": 0.1475, + "step": 22575 + }, + { + "epoch": 2.21, + "learning_rate": 2.371519512870191e-05, + "loss": 0.1429, + "step": 22580 + }, + { + "epoch": 2.21, + "learning_rate": 2.371104345419319e-05, + "loss": 0.1414, + "step": 22585 + }, + { + "epoch": 2.21, + "learning_rate": 2.370689177968447e-05, + "loss": 0.1461, + "step": 22590 + }, + { + "epoch": 2.21, + "learning_rate": 2.3702740105175758e-05, + "loss": 0.1224, + "step": 22595 + }, + { + "epoch": 2.21, + "learning_rate": 2.369858843066704e-05, + "loss": 0.1277, + "step": 22600 + }, + { + "epoch": 2.21, + "learning_rate": 2.369443675615832e-05, + "loss": 0.1583, + "step": 22605 + }, + { + "epoch": 2.21, + "learning_rate": 2.36902850816496e-05, + "loss": 0.1319, + "step": 22610 + }, + { + "epoch": 2.21, + "learning_rate": 2.368613340714088e-05, + "loss": 0.1082, + "step": 22615 + }, + { + "epoch": 2.21, + "learning_rate": 2.368198173263216e-05, + "loss": 0.1431, + "step": 22620 + }, + { + "epoch": 2.21, + "learning_rate": 2.3677830058123442e-05, + "loss": 0.1418, + "step": 22625 + }, + { + "epoch": 2.21, + "learning_rate": 2.3673678383614723e-05, + "loss": 0.1325, + "step": 22630 + }, + { + "epoch": 2.21, + "learning_rate": 2.3669526709106004e-05, + "loss": 0.1216, + "step": 22635 + }, + { + "epoch": 2.21, + "learning_rate": 2.3665375034597288e-05, + "loss": 0.1456, + "step": 22640 + }, + { + "epoch": 2.21, + "learning_rate": 2.3661223360088572e-05, + "loss": 0.1046, + "step": 22645 + }, + { + "epoch": 2.21, + "learning_rate": 2.3657071685579853e-05, + "loss": 0.1257, + "step": 22650 + }, + { + "epoch": 2.22, + "learning_rate": 2.3652920011071134e-05, + "loss": 0.1234, + "step": 22655 + }, + { + "epoch": 2.22, + "learning_rate": 2.3648768336562415e-05, + "loss": 0.1306, + "step": 22660 + }, + { + "epoch": 2.22, + "learning_rate": 2.3644616662053695e-05, + "loss": 0.1265, + "step": 22665 + }, + { + "epoch": 2.22, + "learning_rate": 2.3640464987544976e-05, + "loss": 0.1318, + "step": 22670 + }, + { + "epoch": 2.22, + "learning_rate": 2.3636313313036257e-05, + "loss": 0.1476, + "step": 22675 + }, + { + "epoch": 2.22, + "learning_rate": 2.3632161638527538e-05, + "loss": 0.1195, + "step": 22680 + }, + { + "epoch": 2.22, + "learning_rate": 2.3628009964018822e-05, + "loss": 0.1323, + "step": 22685 + }, + { + "epoch": 2.22, + "learning_rate": 2.3623858289510103e-05, + "loss": 0.1441, + "step": 22690 + }, + { + "epoch": 2.22, + "learning_rate": 2.3619706615001387e-05, + "loss": 0.1287, + "step": 22695 + }, + { + "epoch": 2.22, + "learning_rate": 2.3615554940492668e-05, + "loss": 0.1152, + "step": 22700 + }, + { + "epoch": 2.22, + "learning_rate": 2.3611403265983948e-05, + "loss": 0.1421, + "step": 22705 + }, + { + "epoch": 2.22, + "learning_rate": 2.360725159147523e-05, + "loss": 0.1323, + "step": 22710 + }, + { + "epoch": 2.22, + "learning_rate": 2.360309991696651e-05, + "loss": 0.1168, + "step": 22715 + }, + { + "epoch": 2.22, + "learning_rate": 2.359894824245779e-05, + "loss": 0.1359, + "step": 22720 + }, + { + "epoch": 2.22, + "learning_rate": 2.359479656794907e-05, + "loss": 0.1575, + "step": 22725 + }, + { + "epoch": 2.22, + "learning_rate": 2.3590644893440356e-05, + "loss": 0.1176, + "step": 22730 + }, + { + "epoch": 2.22, + "learning_rate": 2.3586493218931636e-05, + "loss": 0.132, + "step": 22735 + }, + { + "epoch": 2.22, + "learning_rate": 2.3582341544422917e-05, + "loss": 0.1316, + "step": 22740 + }, + { + "epoch": 2.22, + "learning_rate": 2.35781898699142e-05, + "loss": 0.1352, + "step": 22745 + }, + { + "epoch": 2.22, + "learning_rate": 2.3574038195405482e-05, + "loss": 0.1235, + "step": 22750 + }, + { + "epoch": 2.23, + "learning_rate": 2.3569886520896763e-05, + "loss": 0.1503, + "step": 22755 + }, + { + "epoch": 2.23, + "learning_rate": 2.3565734846388044e-05, + "loss": 0.1303, + "step": 22760 + }, + { + "epoch": 2.23, + "learning_rate": 2.3561583171879324e-05, + "loss": 0.1179, + "step": 22765 + }, + { + "epoch": 2.23, + "learning_rate": 2.3557431497370605e-05, + "loss": 0.1312, + "step": 22770 + }, + { + "epoch": 2.23, + "learning_rate": 2.355327982286189e-05, + "loss": 0.131, + "step": 22775 + }, + { + "epoch": 2.23, + "learning_rate": 2.354912814835317e-05, + "loss": 0.1125, + "step": 22780 + }, + { + "epoch": 2.23, + "learning_rate": 2.354497647384445e-05, + "loss": 0.1368, + "step": 22785 + }, + { + "epoch": 2.23, + "learning_rate": 2.354082479933573e-05, + "loss": 0.1362, + "step": 22790 + }, + { + "epoch": 2.23, + "learning_rate": 2.3536673124827012e-05, + "loss": 0.1213, + "step": 22795 + }, + { + "epoch": 2.23, + "learning_rate": 2.3532521450318296e-05, + "loss": 0.1201, + "step": 22800 + }, + { + "epoch": 2.23, + "learning_rate": 2.3528369775809577e-05, + "loss": 0.1542, + "step": 22805 + }, + { + "epoch": 2.23, + "learning_rate": 2.3524218101300858e-05, + "loss": 0.1367, + "step": 22810 + }, + { + "epoch": 2.23, + "learning_rate": 2.3520066426792142e-05, + "loss": 0.1207, + "step": 22815 + }, + { + "epoch": 2.23, + "learning_rate": 2.3515914752283423e-05, + "loss": 0.1502, + "step": 22820 + }, + { + "epoch": 2.23, + "learning_rate": 2.3511763077774704e-05, + "loss": 0.1361, + "step": 22825 + }, + { + "epoch": 2.23, + "learning_rate": 2.3507611403265984e-05, + "loss": 0.114, + "step": 22830 + }, + { + "epoch": 2.23, + "learning_rate": 2.3503459728757265e-05, + "loss": 0.1014, + "step": 22835 + }, + { + "epoch": 2.23, + "learning_rate": 2.3499308054248546e-05, + "loss": 0.1416, + "step": 22840 + }, + { + "epoch": 2.23, + "learning_rate": 2.3495156379739827e-05, + "loss": 0.1275, + "step": 22845 + }, + { + "epoch": 2.23, + "learning_rate": 2.349100470523111e-05, + "loss": 0.1177, + "step": 22850 + }, + { + "epoch": 2.23, + "learning_rate": 2.348685303072239e-05, + "loss": 0.1649, + "step": 22855 + }, + { + "epoch": 2.24, + "learning_rate": 2.3482701356213676e-05, + "loss": 0.1252, + "step": 22860 + }, + { + "epoch": 2.24, + "learning_rate": 2.3478549681704957e-05, + "loss": 0.1148, + "step": 22865 + }, + { + "epoch": 2.24, + "learning_rate": 2.3474398007196237e-05, + "loss": 0.1279, + "step": 22870 + }, + { + "epoch": 2.24, + "learning_rate": 2.3470246332687518e-05, + "loss": 0.1303, + "step": 22875 + }, + { + "epoch": 2.24, + "learning_rate": 2.34660946581788e-05, + "loss": 0.1278, + "step": 22880 + }, + { + "epoch": 2.24, + "learning_rate": 2.346194298367008e-05, + "loss": 0.1197, + "step": 22885 + }, + { + "epoch": 2.24, + "learning_rate": 2.345779130916136e-05, + "loss": 0.1437, + "step": 22890 + }, + { + "epoch": 2.24, + "learning_rate": 2.345363963465264e-05, + "loss": 0.1326, + "step": 22895 + }, + { + "epoch": 2.24, + "learning_rate": 2.3449487960143925e-05, + "loss": 0.1203, + "step": 22900 + }, + { + "epoch": 2.24, + "learning_rate": 2.344533628563521e-05, + "loss": 0.1414, + "step": 22905 + }, + { + "epoch": 2.24, + "learning_rate": 2.344118461112649e-05, + "loss": 0.1338, + "step": 22910 + }, + { + "epoch": 2.24, + "learning_rate": 2.343703293661777e-05, + "loss": 0.1104, + "step": 22915 + }, + { + "epoch": 2.24, + "learning_rate": 2.3432881262109052e-05, + "loss": 0.1191, + "step": 22920 + }, + { + "epoch": 2.24, + "learning_rate": 2.3428729587600333e-05, + "loss": 0.14, + "step": 22925 + }, + { + "epoch": 2.24, + "learning_rate": 2.3424577913091613e-05, + "loss": 0.1205, + "step": 22930 + }, + { + "epoch": 2.24, + "learning_rate": 2.3420426238582894e-05, + "loss": 0.1014, + "step": 22935 + }, + { + "epoch": 2.24, + "learning_rate": 2.3416274564074175e-05, + "loss": 0.1458, + "step": 22940 + }, + { + "epoch": 2.24, + "learning_rate": 2.3412122889565456e-05, + "loss": 0.1111, + "step": 22945 + }, + { + "epoch": 2.24, + "learning_rate": 2.3407971215056743e-05, + "loss": 0.1149, + "step": 22950 + }, + { + "epoch": 2.24, + "learning_rate": 2.3403819540548024e-05, + "loss": 0.1405, + "step": 22955 + }, + { + "epoch": 2.25, + "learning_rate": 2.3399667866039305e-05, + "loss": 0.1171, + "step": 22960 + }, + { + "epoch": 2.25, + "learning_rate": 2.3395516191530586e-05, + "loss": 0.1202, + "step": 22965 + }, + { + "epoch": 2.25, + "learning_rate": 2.3391364517021866e-05, + "loss": 0.1325, + "step": 22970 + }, + { + "epoch": 2.25, + "learning_rate": 2.3387212842513147e-05, + "loss": 0.1429, + "step": 22975 + }, + { + "epoch": 2.25, + "learning_rate": 2.3383061168004428e-05, + "loss": 0.1174, + "step": 22980 + }, + { + "epoch": 2.25, + "learning_rate": 2.337890949349571e-05, + "loss": 0.131, + "step": 22985 + }, + { + "epoch": 2.25, + "learning_rate": 2.337475781898699e-05, + "loss": 0.1502, + "step": 22990 + }, + { + "epoch": 2.25, + "learning_rate": 2.3370606144478274e-05, + "loss": 0.1281, + "step": 22995 + }, + { + "epoch": 2.25, + "learning_rate": 2.3366454469969554e-05, + "loss": 0.1315, + "step": 23000 + }, + { + "epoch": 2.25, + "eval_cer": 0.06434651109554167, + "eval_loss": 0.26808956265449524, + "eval_runtime": 281.0952, + "eval_samples_per_second": 58.236, + "eval_steps_per_second": 1.619, + "eval_wer": 0.16396439928694095, + "step": 23000 + }, + { + "epoch": 2.25, + "learning_rate": 2.336230279546084e-05, + "loss": 0.152, + "step": 23005 + }, + { + "epoch": 2.25, + "learning_rate": 2.335815112095212e-05, + "loss": 0.1261, + "step": 23010 + }, + { + "epoch": 2.25, + "learning_rate": 2.33539994464434e-05, + "loss": 0.1159, + "step": 23015 + }, + { + "epoch": 2.25, + "learning_rate": 2.334984777193468e-05, + "loss": 0.1411, + "step": 23020 + }, + { + "epoch": 2.25, + "learning_rate": 2.334569609742596e-05, + "loss": 0.1641, + "step": 23025 + }, + { + "epoch": 2.25, + "learning_rate": 2.3341544422917242e-05, + "loss": 0.1253, + "step": 23030 + }, + { + "epoch": 2.25, + "learning_rate": 2.3337392748408526e-05, + "loss": 0.1405, + "step": 23035 + }, + { + "epoch": 2.25, + "learning_rate": 2.3333241073899807e-05, + "loss": 0.1367, + "step": 23040 + }, + { + "epoch": 2.25, + "learning_rate": 2.3329089399391088e-05, + "loss": 0.1376, + "step": 23045 + }, + { + "epoch": 2.25, + "learning_rate": 2.332493772488237e-05, + "loss": 0.1322, + "step": 23050 + }, + { + "epoch": 2.25, + "learning_rate": 2.3320786050373653e-05, + "loss": 0.1498, + "step": 23055 + }, + { + "epoch": 2.25, + "learning_rate": 2.3316634375864934e-05, + "loss": 0.118, + "step": 23060 + }, + { + "epoch": 2.26, + "learning_rate": 2.3312482701356214e-05, + "loss": 0.1164, + "step": 23065 + }, + { + "epoch": 2.26, + "learning_rate": 2.3308331026847495e-05, + "loss": 0.1239, + "step": 23070 + }, + { + "epoch": 2.26, + "learning_rate": 2.3304179352338776e-05, + "loss": 0.1407, + "step": 23075 + }, + { + "epoch": 2.26, + "learning_rate": 2.330002767783006e-05, + "loss": 0.1225, + "step": 23080 + }, + { + "epoch": 2.26, + "learning_rate": 2.329587600332134e-05, + "loss": 0.123, + "step": 23085 + }, + { + "epoch": 2.26, + "learning_rate": 2.329172432881262e-05, + "loss": 0.1398, + "step": 23090 + }, + { + "epoch": 2.26, + "learning_rate": 2.3287572654303902e-05, + "loss": 0.1324, + "step": 23095 + }, + { + "epoch": 2.26, + "learning_rate": 2.3283420979795183e-05, + "loss": 0.1139, + "step": 23100 + }, + { + "epoch": 2.26, + "learning_rate": 2.3279269305286467e-05, + "loss": 0.15, + "step": 23105 + }, + { + "epoch": 2.26, + "learning_rate": 2.3275117630777748e-05, + "loss": 0.1233, + "step": 23110 + }, + { + "epoch": 2.26, + "learning_rate": 2.327096595626903e-05, + "loss": 0.128, + "step": 23115 + }, + { + "epoch": 2.26, + "learning_rate": 2.326681428176031e-05, + "loss": 0.1348, + "step": 23120 + }, + { + "epoch": 2.26, + "learning_rate": 2.3262662607251594e-05, + "loss": 0.138, + "step": 23125 + }, + { + "epoch": 2.26, + "learning_rate": 2.3258510932742875e-05, + "loss": 0.1146, + "step": 23130 + }, + { + "epoch": 2.26, + "learning_rate": 2.3254359258234155e-05, + "loss": 0.1181, + "step": 23135 + }, + { + "epoch": 2.26, + "learning_rate": 2.3250207583725436e-05, + "loss": 0.1531, + "step": 23140 + }, + { + "epoch": 2.26, + "learning_rate": 2.3246055909216717e-05, + "loss": 0.1147, + "step": 23145 + }, + { + "epoch": 2.26, + "learning_rate": 2.3241904234707998e-05, + "loss": 0.1355, + "step": 23150 + }, + { + "epoch": 2.26, + "learning_rate": 2.3237752560199282e-05, + "loss": 0.1294, + "step": 23155 + }, + { + "epoch": 2.26, + "learning_rate": 2.3233600885690563e-05, + "loss": 0.1319, + "step": 23160 + }, + { + "epoch": 2.27, + "learning_rate": 2.3229449211181843e-05, + "loss": 0.1209, + "step": 23165 + }, + { + "epoch": 2.27, + "learning_rate": 2.3225297536673128e-05, + "loss": 0.1424, + "step": 23170 + }, + { + "epoch": 2.27, + "learning_rate": 2.3221145862164408e-05, + "loss": 0.1566, + "step": 23175 + }, + { + "epoch": 2.27, + "learning_rate": 2.321699418765569e-05, + "loss": 0.1171, + "step": 23180 + }, + { + "epoch": 2.27, + "learning_rate": 2.321284251314697e-05, + "loss": 0.127, + "step": 23185 + }, + { + "epoch": 2.27, + "learning_rate": 2.320869083863825e-05, + "loss": 0.1545, + "step": 23190 + }, + { + "epoch": 2.27, + "learning_rate": 2.320453916412953e-05, + "loss": 0.1198, + "step": 23195 + }, + { + "epoch": 2.27, + "learning_rate": 2.3200387489620812e-05, + "loss": 0.1196, + "step": 23200 + }, + { + "epoch": 2.27, + "learning_rate": 2.3196235815112093e-05, + "loss": 0.164, + "step": 23205 + }, + { + "epoch": 2.27, + "learning_rate": 2.3192084140603377e-05, + "loss": 0.1285, + "step": 23210 + }, + { + "epoch": 2.27, + "learning_rate": 2.318793246609466e-05, + "loss": 0.1227, + "step": 23215 + }, + { + "epoch": 2.27, + "learning_rate": 2.3183780791585942e-05, + "loss": 0.1094, + "step": 23220 + }, + { + "epoch": 2.27, + "learning_rate": 2.3179629117077223e-05, + "loss": 0.1352, + "step": 23225 + }, + { + "epoch": 2.27, + "learning_rate": 2.3175477442568504e-05, + "loss": 0.1269, + "step": 23230 + }, + { + "epoch": 2.27, + "learning_rate": 2.3171325768059784e-05, + "loss": 0.1254, + "step": 23235 + }, + { + "epoch": 2.27, + "learning_rate": 2.3167174093551065e-05, + "loss": 0.1585, + "step": 23240 + }, + { + "epoch": 2.27, + "learning_rate": 2.3163022419042346e-05, + "loss": 0.1149, + "step": 23245 + }, + { + "epoch": 2.27, + "learning_rate": 2.3158870744533627e-05, + "loss": 0.1261, + "step": 23250 + }, + { + "epoch": 2.27, + "learning_rate": 2.315471907002491e-05, + "loss": 0.1436, + "step": 23255 + }, + { + "epoch": 2.27, + "learning_rate": 2.3150567395516195e-05, + "loss": 0.1369, + "step": 23260 + }, + { + "epoch": 2.27, + "learning_rate": 2.3146415721007476e-05, + "loss": 0.1356, + "step": 23265 + }, + { + "epoch": 2.28, + "learning_rate": 2.3142264046498756e-05, + "loss": 0.1347, + "step": 23270 + }, + { + "epoch": 2.28, + "learning_rate": 2.3138112371990037e-05, + "loss": 0.1504, + "step": 23275 + }, + { + "epoch": 2.28, + "learning_rate": 2.3133960697481318e-05, + "loss": 0.1154, + "step": 23280 + }, + { + "epoch": 2.28, + "learning_rate": 2.31298090229726e-05, + "loss": 0.1436, + "step": 23285 + }, + { + "epoch": 2.28, + "learning_rate": 2.312565734846388e-05, + "loss": 0.1452, + "step": 23290 + }, + { + "epoch": 2.28, + "learning_rate": 2.312150567395516e-05, + "loss": 0.1197, + "step": 23295 + }, + { + "epoch": 2.28, + "learning_rate": 2.3117353999446444e-05, + "loss": 0.1109, + "step": 23300 + }, + { + "epoch": 2.28, + "learning_rate": 2.3113202324937725e-05, + "loss": 0.1323, + "step": 23305 + }, + { + "epoch": 2.28, + "learning_rate": 2.310905065042901e-05, + "loss": 0.1191, + "step": 23310 + }, + { + "epoch": 2.28, + "learning_rate": 2.310489897592029e-05, + "loss": 0.1099, + "step": 23315 + }, + { + "epoch": 2.28, + "learning_rate": 2.310074730141157e-05, + "loss": 0.1261, + "step": 23320 + }, + { + "epoch": 2.28, + "learning_rate": 2.309659562690285e-05, + "loss": 0.141, + "step": 23325 + }, + { + "epoch": 2.28, + "learning_rate": 2.3092443952394132e-05, + "loss": 0.1209, + "step": 23330 + }, + { + "epoch": 2.28, + "learning_rate": 2.3088292277885413e-05, + "loss": 0.1157, + "step": 23335 + }, + { + "epoch": 2.28, + "learning_rate": 2.3084140603376694e-05, + "loss": 0.1343, + "step": 23340 + }, + { + "epoch": 2.28, + "learning_rate": 2.3079988928867978e-05, + "loss": 0.1282, + "step": 23345 + }, + { + "epoch": 2.28, + "learning_rate": 2.307583725435926e-05, + "loss": 0.1288, + "step": 23350 + }, + { + "epoch": 2.28, + "learning_rate": 2.307168557985054e-05, + "loss": 0.1567, + "step": 23355 + }, + { + "epoch": 2.28, + "learning_rate": 2.3067533905341824e-05, + "loss": 0.1285, + "step": 23360 + }, + { + "epoch": 2.28, + "learning_rate": 2.3063382230833105e-05, + "loss": 0.1191, + "step": 23365 + }, + { + "epoch": 2.29, + "learning_rate": 2.3059230556324385e-05, + "loss": 0.1253, + "step": 23370 + }, + { + "epoch": 2.29, + "learning_rate": 2.3055078881815666e-05, + "loss": 0.1439, + "step": 23375 + }, + { + "epoch": 2.29, + "learning_rate": 2.3050927207306947e-05, + "loss": 0.1104, + "step": 23380 + }, + { + "epoch": 2.29, + "learning_rate": 2.3046775532798228e-05, + "loss": 0.1169, + "step": 23385 + }, + { + "epoch": 2.29, + "learning_rate": 2.3042623858289512e-05, + "loss": 0.1719, + "step": 23390 + }, + { + "epoch": 2.29, + "learning_rate": 2.3038472183780793e-05, + "loss": 0.1271, + "step": 23395 + }, + { + "epoch": 2.29, + "learning_rate": 2.3034320509272073e-05, + "loss": 0.127, + "step": 23400 + }, + { + "epoch": 2.29, + "learning_rate": 2.3030168834763354e-05, + "loss": 0.1311, + "step": 23405 + }, + { + "epoch": 2.29, + "learning_rate": 2.3026017160254635e-05, + "loss": 0.1196, + "step": 23410 + }, + { + "epoch": 2.29, + "learning_rate": 2.302186548574592e-05, + "loss": 0.1277, + "step": 23415 + }, + { + "epoch": 2.29, + "learning_rate": 2.30177138112372e-05, + "loss": 0.1309, + "step": 23420 + }, + { + "epoch": 2.29, + "learning_rate": 2.301356213672848e-05, + "loss": 0.1425, + "step": 23425 + }, + { + "epoch": 2.29, + "learning_rate": 2.300941046221976e-05, + "loss": 0.1124, + "step": 23430 + }, + { + "epoch": 2.29, + "learning_rate": 2.3005258787711046e-05, + "loss": 0.1328, + "step": 23435 + }, + { + "epoch": 2.29, + "learning_rate": 2.3001107113202326e-05, + "loss": 0.1507, + "step": 23440 + }, + { + "epoch": 2.29, + "learning_rate": 2.2996955438693607e-05, + "loss": 0.1094, + "step": 23445 + }, + { + "epoch": 2.29, + "learning_rate": 2.2992803764184888e-05, + "loss": 0.1066, + "step": 23450 + }, + { + "epoch": 2.29, + "learning_rate": 2.298865208967617e-05, + "loss": 0.1708, + "step": 23455 + }, + { + "epoch": 2.29, + "learning_rate": 2.298450041516745e-05, + "loss": 0.1333, + "step": 23460 + }, + { + "epoch": 2.29, + "learning_rate": 2.2980348740658734e-05, + "loss": 0.1214, + "step": 23465 + }, + { + "epoch": 2.29, + "learning_rate": 2.2976197066150014e-05, + "loss": 0.1218, + "step": 23470 + }, + { + "epoch": 2.3, + "learning_rate": 2.2972045391641295e-05, + "loss": 0.1445, + "step": 23475 + }, + { + "epoch": 2.3, + "learning_rate": 2.296789371713258e-05, + "loss": 0.1118, + "step": 23480 + }, + { + "epoch": 2.3, + "learning_rate": 2.296374204262386e-05, + "loss": 0.1236, + "step": 23485 + }, + { + "epoch": 2.3, + "learning_rate": 2.295959036811514e-05, + "loss": 0.1462, + "step": 23490 + }, + { + "epoch": 2.3, + "learning_rate": 2.295543869360642e-05, + "loss": 0.1207, + "step": 23495 + }, + { + "epoch": 2.3, + "learning_rate": 2.2951287019097702e-05, + "loss": 0.1218, + "step": 23500 + }, + { + "epoch": 2.3, + "eval_cer": 0.06392914206964166, + "eval_loss": 0.2615985572338104, + "eval_runtime": 278.9422, + "eval_samples_per_second": 58.686, + "eval_steps_per_second": 1.631, + "eval_wer": 0.1607386560273731, + "step": 23500 + }, + { + "epoch": 2.3, + "learning_rate": 2.2947135344588983e-05, + "loss": 0.1558, + "step": 23505 + }, + { + "epoch": 2.3, + "learning_rate": 2.2942983670080264e-05, + "loss": 0.152, + "step": 23510 + }, + { + "epoch": 2.3, + "learning_rate": 2.2938831995571548e-05, + "loss": 0.1085, + "step": 23515 + }, + { + "epoch": 2.3, + "learning_rate": 2.2934680321062832e-05, + "loss": 0.1216, + "step": 23520 + }, + { + "epoch": 2.3, + "learning_rate": 2.2930528646554113e-05, + "loss": 0.1494, + "step": 23525 + }, + { + "epoch": 2.3, + "learning_rate": 2.2926376972045394e-05, + "loss": 0.1268, + "step": 23530 + }, + { + "epoch": 2.3, + "learning_rate": 2.2922225297536674e-05, + "loss": 0.1155, + "step": 23535 + }, + { + "epoch": 2.3, + "learning_rate": 2.2918073623027955e-05, + "loss": 0.1445, + "step": 23540 + }, + { + "epoch": 2.3, + "learning_rate": 2.2913921948519236e-05, + "loss": 0.1227, + "step": 23545 + }, + { + "epoch": 2.3, + "learning_rate": 2.2909770274010517e-05, + "loss": 0.1149, + "step": 23550 + }, + { + "epoch": 2.3, + "learning_rate": 2.2905618599501798e-05, + "loss": 0.1388, + "step": 23555 + }, + { + "epoch": 2.3, + "learning_rate": 2.2901466924993078e-05, + "loss": 0.1328, + "step": 23560 + }, + { + "epoch": 2.3, + "learning_rate": 2.2897315250484366e-05, + "loss": 0.1148, + "step": 23565 + }, + { + "epoch": 2.3, + "learning_rate": 2.2893163575975647e-05, + "loss": 0.1272, + "step": 23570 + }, + { + "epoch": 2.31, + "learning_rate": 2.2889011901466927e-05, + "loss": 0.1253, + "step": 23575 + }, + { + "epoch": 2.31, + "learning_rate": 2.2884860226958208e-05, + "loss": 0.1273, + "step": 23580 + }, + { + "epoch": 2.31, + "learning_rate": 2.288070855244949e-05, + "loss": 0.1316, + "step": 23585 + }, + { + "epoch": 2.31, + "learning_rate": 2.287655687794077e-05, + "loss": 0.1395, + "step": 23590 + }, + { + "epoch": 2.31, + "learning_rate": 2.287240520343205e-05, + "loss": 0.1088, + "step": 23595 + }, + { + "epoch": 2.31, + "learning_rate": 2.286825352892333e-05, + "loss": 0.1182, + "step": 23600 + }, + { + "epoch": 2.31, + "learning_rate": 2.2864101854414612e-05, + "loss": 0.1436, + "step": 23605 + }, + { + "epoch": 2.31, + "learning_rate": 2.2859950179905896e-05, + "loss": 0.1196, + "step": 23610 + }, + { + "epoch": 2.31, + "learning_rate": 2.2855798505397177e-05, + "loss": 0.1141, + "step": 23615 + }, + { + "epoch": 2.31, + "learning_rate": 2.285164683088846e-05, + "loss": 0.1383, + "step": 23620 + }, + { + "epoch": 2.31, + "learning_rate": 2.2847495156379742e-05, + "loss": 0.1339, + "step": 23625 + }, + { + "epoch": 2.31, + "learning_rate": 2.2843343481871023e-05, + "loss": 0.1285, + "step": 23630 + }, + { + "epoch": 2.31, + "learning_rate": 2.2839191807362303e-05, + "loss": 0.1132, + "step": 23635 + }, + { + "epoch": 2.31, + "learning_rate": 2.2835040132853584e-05, + "loss": 0.1472, + "step": 23640 + }, + { + "epoch": 2.31, + "learning_rate": 2.2830888458344865e-05, + "loss": 0.1239, + "step": 23645 + }, + { + "epoch": 2.31, + "learning_rate": 2.2826736783836146e-05, + "loss": 0.1191, + "step": 23650 + }, + { + "epoch": 2.31, + "learning_rate": 2.282258510932743e-05, + "loss": 0.1388, + "step": 23655 + }, + { + "epoch": 2.31, + "learning_rate": 2.281843343481871e-05, + "loss": 0.1295, + "step": 23660 + }, + { + "epoch": 2.31, + "learning_rate": 2.281428176030999e-05, + "loss": 0.1142, + "step": 23665 + }, + { + "epoch": 2.31, + "learning_rate": 2.2810130085801276e-05, + "loss": 0.1315, + "step": 23670 + }, + { + "epoch": 2.32, + "learning_rate": 2.2805978411292556e-05, + "loss": 0.1456, + "step": 23675 + }, + { + "epoch": 2.32, + "learning_rate": 2.2801826736783837e-05, + "loss": 0.1222, + "step": 23680 + }, + { + "epoch": 2.32, + "learning_rate": 2.2797675062275118e-05, + "loss": 0.1154, + "step": 23685 + }, + { + "epoch": 2.32, + "learning_rate": 2.27935233877664e-05, + "loss": 0.1657, + "step": 23690 + }, + { + "epoch": 2.32, + "learning_rate": 2.278937171325768e-05, + "loss": 0.1121, + "step": 23695 + }, + { + "epoch": 2.32, + "learning_rate": 2.2785220038748964e-05, + "loss": 0.1062, + "step": 23700 + }, + { + "epoch": 2.32, + "learning_rate": 2.2781068364240244e-05, + "loss": 0.1505, + "step": 23705 + }, + { + "epoch": 2.32, + "learning_rate": 2.2776916689731525e-05, + "loss": 0.1183, + "step": 23710 + }, + { + "epoch": 2.32, + "learning_rate": 2.2772765015222806e-05, + "loss": 0.112, + "step": 23715 + }, + { + "epoch": 2.32, + "learning_rate": 2.276861334071409e-05, + "loss": 0.1449, + "step": 23720 + }, + { + "epoch": 2.32, + "learning_rate": 2.276446166620537e-05, + "loss": 0.133, + "step": 23725 + }, + { + "epoch": 2.32, + "learning_rate": 2.276030999169665e-05, + "loss": 0.1256, + "step": 23730 + }, + { + "epoch": 2.32, + "learning_rate": 2.2756158317187932e-05, + "loss": 0.1127, + "step": 23735 + }, + { + "epoch": 2.32, + "learning_rate": 2.2752006642679216e-05, + "loss": 0.1319, + "step": 23740 + }, + { + "epoch": 2.32, + "learning_rate": 2.2747854968170497e-05, + "loss": 0.1212, + "step": 23745 + }, + { + "epoch": 2.32, + "learning_rate": 2.2743703293661778e-05, + "loss": 0.1263, + "step": 23750 + }, + { + "epoch": 2.32, + "learning_rate": 2.273955161915306e-05, + "loss": 0.1326, + "step": 23755 + }, + { + "epoch": 2.32, + "learning_rate": 2.273539994464434e-05, + "loss": 0.1256, + "step": 23760 + }, + { + "epoch": 2.32, + "learning_rate": 2.273124827013562e-05, + "loss": 0.1187, + "step": 23765 + }, + { + "epoch": 2.32, + "learning_rate": 2.2727096595626904e-05, + "loss": 0.1286, + "step": 23770 + }, + { + "epoch": 2.32, + "learning_rate": 2.2722944921118185e-05, + "loss": 0.1202, + "step": 23775 + }, + { + "epoch": 2.33, + "learning_rate": 2.2718793246609466e-05, + "loss": 0.1022, + "step": 23780 + }, + { + "epoch": 2.33, + "learning_rate": 2.271464157210075e-05, + "loss": 0.1294, + "step": 23785 + }, + { + "epoch": 2.33, + "learning_rate": 2.271048989759203e-05, + "loss": 0.1463, + "step": 23790 + }, + { + "epoch": 2.33, + "learning_rate": 2.270633822308331e-05, + "loss": 0.1122, + "step": 23795 + }, + { + "epoch": 2.33, + "learning_rate": 2.2702186548574592e-05, + "loss": 0.1258, + "step": 23800 + }, + { + "epoch": 2.33, + "learning_rate": 2.2698865208967617e-05, + "loss": 0.1624, + "step": 23805 + }, + { + "epoch": 2.33, + "learning_rate": 2.2694713534458898e-05, + "loss": 0.1182, + "step": 23810 + }, + { + "epoch": 2.33, + "learning_rate": 2.2690561859950182e-05, + "loss": 0.1295, + "step": 23815 + }, + { + "epoch": 2.33, + "learning_rate": 2.2686410185441463e-05, + "loss": 0.132, + "step": 23820 + }, + { + "epoch": 2.33, + "learning_rate": 2.2682258510932743e-05, + "loss": 0.1618, + "step": 23825 + }, + { + "epoch": 2.33, + "learning_rate": 2.2678106836424024e-05, + "loss": 0.1183, + "step": 23830 + }, + { + "epoch": 2.33, + "learning_rate": 2.2673955161915305e-05, + "loss": 0.1002, + "step": 23835 + }, + { + "epoch": 2.33, + "learning_rate": 2.2669803487406586e-05, + "loss": 0.1429, + "step": 23840 + }, + { + "epoch": 2.33, + "learning_rate": 2.266565181289787e-05, + "loss": 0.106, + "step": 23845 + }, + { + "epoch": 2.33, + "learning_rate": 2.266150013838915e-05, + "loss": 0.1219, + "step": 23850 + }, + { + "epoch": 2.33, + "learning_rate": 2.265734846388043e-05, + "loss": 0.138, + "step": 23855 + }, + { + "epoch": 2.33, + "learning_rate": 2.2653196789371716e-05, + "loss": 0.1192, + "step": 23860 + }, + { + "epoch": 2.33, + "learning_rate": 2.2649045114862996e-05, + "loss": 0.1139, + "step": 23865 + }, + { + "epoch": 2.33, + "learning_rate": 2.2644893440354277e-05, + "loss": 0.137, + "step": 23870 + }, + { + "epoch": 2.33, + "learning_rate": 2.2640741765845558e-05, + "loss": 0.1482, + "step": 23875 + }, + { + "epoch": 2.34, + "learning_rate": 2.263659009133684e-05, + "loss": 0.1084, + "step": 23880 + }, + { + "epoch": 2.34, + "learning_rate": 2.263243841682812e-05, + "loss": 0.1235, + "step": 23885 + }, + { + "epoch": 2.34, + "learning_rate": 2.26282867423194e-05, + "loss": 0.1448, + "step": 23890 + }, + { + "epoch": 2.34, + "learning_rate": 2.2624135067810684e-05, + "loss": 0.1374, + "step": 23895 + }, + { + "epoch": 2.34, + "learning_rate": 2.261998339330197e-05, + "loss": 0.1152, + "step": 23900 + }, + { + "epoch": 2.34, + "learning_rate": 2.261583171879325e-05, + "loss": 0.1424, + "step": 23905 + }, + { + "epoch": 2.34, + "learning_rate": 2.261168004428453e-05, + "loss": 0.1152, + "step": 23910 + }, + { + "epoch": 2.34, + "learning_rate": 2.260752836977581e-05, + "loss": 0.1241, + "step": 23915 + }, + { + "epoch": 2.34, + "learning_rate": 2.260337669526709e-05, + "loss": 0.1457, + "step": 23920 + }, + { + "epoch": 2.34, + "learning_rate": 2.2599225020758372e-05, + "loss": 0.1337, + "step": 23925 + }, + { + "epoch": 2.34, + "learning_rate": 2.2595073346249653e-05, + "loss": 0.1008, + "step": 23930 + }, + { + "epoch": 2.34, + "learning_rate": 2.2590921671740934e-05, + "loss": 0.1382, + "step": 23935 + }, + { + "epoch": 2.34, + "learning_rate": 2.2586769997232215e-05, + "loss": 0.1562, + "step": 23940 + }, + { + "epoch": 2.34, + "learning_rate": 2.2582618322723502e-05, + "loss": 0.1026, + "step": 23945 + }, + { + "epoch": 2.34, + "learning_rate": 2.2578466648214783e-05, + "loss": 0.1161, + "step": 23950 + }, + { + "epoch": 2.34, + "learning_rate": 2.2574314973706064e-05, + "loss": 0.1425, + "step": 23955 + }, + { + "epoch": 2.34, + "learning_rate": 2.2570163299197345e-05, + "loss": 0.1282, + "step": 23960 + }, + { + "epoch": 2.34, + "learning_rate": 2.2566011624688625e-05, + "loss": 0.1362, + "step": 23965 + }, + { + "epoch": 2.34, + "learning_rate": 2.2561859950179906e-05, + "loss": 0.1163, + "step": 23970 + }, + { + "epoch": 2.34, + "learning_rate": 2.2557708275671187e-05, + "loss": 0.1398, + "step": 23975 + }, + { + "epoch": 2.34, + "learning_rate": 2.2553556601162468e-05, + "loss": 0.108, + "step": 23980 + }, + { + "epoch": 2.35, + "learning_rate": 2.254940492665375e-05, + "loss": 0.1222, + "step": 23985 + }, + { + "epoch": 2.35, + "learning_rate": 2.2545253252145033e-05, + "loss": 0.164, + "step": 23990 + }, + { + "epoch": 2.35, + "learning_rate": 2.2541101577636313e-05, + "loss": 0.1111, + "step": 23995 + }, + { + "epoch": 2.35, + "learning_rate": 2.2536949903127597e-05, + "loss": 0.1167, + "step": 24000 + }, + { + "epoch": 2.35, + "eval_cer": 0.06271518783918459, + "eval_loss": 0.273235023021698, + "eval_runtime": 274.0596, + "eval_samples_per_second": 59.732, + "eval_steps_per_second": 1.66, + "eval_wer": 0.15988324637756868, + "step": 24000 + }, + { + "epoch": 2.35, + "learning_rate": 2.2532798228618878e-05, + "loss": 0.1316, + "step": 24005 + }, + { + "epoch": 2.35, + "learning_rate": 2.252864655411016e-05, + "loss": 0.1198, + "step": 24010 + }, + { + "epoch": 2.35, + "learning_rate": 2.252449487960144e-05, + "loss": 0.1136, + "step": 24015 + }, + { + "epoch": 2.35, + "learning_rate": 2.252034320509272e-05, + "loss": 0.1377, + "step": 24020 + }, + { + "epoch": 2.35, + "learning_rate": 2.2516191530584e-05, + "loss": 0.1444, + "step": 24025 + }, + { + "epoch": 2.35, + "learning_rate": 2.2512039856075282e-05, + "loss": 0.1172, + "step": 24030 + }, + { + "epoch": 2.35, + "learning_rate": 2.2507888181566566e-05, + "loss": 0.1107, + "step": 24035 + }, + { + "epoch": 2.35, + "learning_rate": 2.2503736507057847e-05, + "loss": 0.1435, + "step": 24040 + }, + { + "epoch": 2.35, + "learning_rate": 2.2499584832549128e-05, + "loss": 0.1281, + "step": 24045 + }, + { + "epoch": 2.35, + "learning_rate": 2.2495433158040412e-05, + "loss": 0.1122, + "step": 24050 + }, + { + "epoch": 2.35, + "learning_rate": 2.2491281483531693e-05, + "loss": 0.1538, + "step": 24055 + }, + { + "epoch": 2.35, + "learning_rate": 2.2487129809022973e-05, + "loss": 0.1338, + "step": 24060 + }, + { + "epoch": 2.35, + "learning_rate": 2.2482978134514254e-05, + "loss": 0.1264, + "step": 24065 + }, + { + "epoch": 2.35, + "learning_rate": 2.2478826460005535e-05, + "loss": 0.1195, + "step": 24070 + }, + { + "epoch": 2.35, + "learning_rate": 2.2474674785496816e-05, + "loss": 0.1277, + "step": 24075 + }, + { + "epoch": 2.35, + "learning_rate": 2.24705231109881e-05, + "loss": 0.1167, + "step": 24080 + }, + { + "epoch": 2.36, + "learning_rate": 2.246637143647938e-05, + "loss": 0.1231, + "step": 24085 + }, + { + "epoch": 2.36, + "learning_rate": 2.246221976197066e-05, + "loss": 0.1489, + "step": 24090 + }, + { + "epoch": 2.36, + "learning_rate": 2.2458068087461942e-05, + "loss": 0.1168, + "step": 24095 + }, + { + "epoch": 2.36, + "learning_rate": 2.2453916412953226e-05, + "loss": 0.1047, + "step": 24100 + }, + { + "epoch": 2.36, + "learning_rate": 2.2449764738444507e-05, + "loss": 0.1236, + "step": 24105 + }, + { + "epoch": 2.36, + "learning_rate": 2.2445613063935788e-05, + "loss": 0.11, + "step": 24110 + }, + { + "epoch": 2.36, + "learning_rate": 2.244146138942707e-05, + "loss": 0.1066, + "step": 24115 + }, + { + "epoch": 2.36, + "learning_rate": 2.2437309714918353e-05, + "loss": 0.1246, + "step": 24120 + }, + { + "epoch": 2.36, + "learning_rate": 2.2433158040409634e-05, + "loss": 0.1234, + "step": 24125 + }, + { + "epoch": 2.36, + "learning_rate": 2.2429006365900914e-05, + "loss": 0.1233, + "step": 24130 + }, + { + "epoch": 2.36, + "learning_rate": 2.2424854691392195e-05, + "loss": 0.133, + "step": 24135 + }, + { + "epoch": 2.36, + "learning_rate": 2.2420703016883476e-05, + "loss": 0.1429, + "step": 24140 + }, + { + "epoch": 2.36, + "learning_rate": 2.2416551342374757e-05, + "loss": 0.121, + "step": 24145 + }, + { + "epoch": 2.36, + "learning_rate": 2.241239966786604e-05, + "loss": 0.118, + "step": 24150 + }, + { + "epoch": 2.36, + "learning_rate": 2.240824799335732e-05, + "loss": 0.1461, + "step": 24155 + }, + { + "epoch": 2.36, + "learning_rate": 2.2404096318848602e-05, + "loss": 0.1166, + "step": 24160 + }, + { + "epoch": 2.36, + "learning_rate": 2.2399944644339887e-05, + "loss": 0.1061, + "step": 24165 + }, + { + "epoch": 2.36, + "learning_rate": 2.2395792969831167e-05, + "loss": 0.1235, + "step": 24170 + }, + { + "epoch": 2.36, + "learning_rate": 2.2391641295322448e-05, + "loss": 0.1431, + "step": 24175 + }, + { + "epoch": 2.36, + "learning_rate": 2.238748962081373e-05, + "loss": 0.1203, + "step": 24180 + }, + { + "epoch": 2.36, + "learning_rate": 2.238333794630501e-05, + "loss": 0.1381, + "step": 24185 + }, + { + "epoch": 2.37, + "learning_rate": 2.237918627179629e-05, + "loss": 0.1401, + "step": 24190 + }, + { + "epoch": 2.37, + "learning_rate": 2.237503459728757e-05, + "loss": 0.1182, + "step": 24195 + }, + { + "epoch": 2.37, + "learning_rate": 2.2370882922778852e-05, + "loss": 0.1204, + "step": 24200 + }, + { + "epoch": 2.37, + "learning_rate": 2.2366731248270136e-05, + "loss": 0.1338, + "step": 24205 + }, + { + "epoch": 2.37, + "learning_rate": 2.236257957376142e-05, + "loss": 0.1437, + "step": 24210 + }, + { + "epoch": 2.37, + "learning_rate": 2.23584278992527e-05, + "loss": 0.1176, + "step": 24215 + }, + { + "epoch": 2.37, + "learning_rate": 2.2354276224743982e-05, + "loss": 0.1417, + "step": 24220 + }, + { + "epoch": 2.37, + "learning_rate": 2.2350124550235263e-05, + "loss": 0.1276, + "step": 24225 + }, + { + "epoch": 2.37, + "learning_rate": 2.2345972875726543e-05, + "loss": 0.1113, + "step": 24230 + }, + { + "epoch": 2.37, + "learning_rate": 2.2341821201217824e-05, + "loss": 0.1111, + "step": 24235 + }, + { + "epoch": 2.37, + "learning_rate": 2.2337669526709105e-05, + "loss": 0.1431, + "step": 24240 + }, + { + "epoch": 2.37, + "learning_rate": 2.2333517852200386e-05, + "loss": 0.1261, + "step": 24245 + }, + { + "epoch": 2.37, + "learning_rate": 2.2329366177691666e-05, + "loss": 0.1095, + "step": 24250 + }, + { + "epoch": 2.37, + "learning_rate": 2.2325214503182954e-05, + "loss": 0.1498, + "step": 24255 + }, + { + "epoch": 2.37, + "learning_rate": 2.2321062828674235e-05, + "loss": 0.1201, + "step": 24260 + }, + { + "epoch": 2.37, + "learning_rate": 2.2316911154165515e-05, + "loss": 0.1251, + "step": 24265 + }, + { + "epoch": 2.37, + "learning_rate": 2.2312759479656796e-05, + "loss": 0.1451, + "step": 24270 + }, + { + "epoch": 2.37, + "learning_rate": 2.2308607805148077e-05, + "loss": 0.1393, + "step": 24275 + }, + { + "epoch": 2.37, + "learning_rate": 2.2304456130639358e-05, + "loss": 0.1243, + "step": 24280 + }, + { + "epoch": 2.37, + "learning_rate": 2.230030445613064e-05, + "loss": 0.113, + "step": 24285 + }, + { + "epoch": 2.38, + "learning_rate": 2.229615278162192e-05, + "loss": 0.1458, + "step": 24290 + }, + { + "epoch": 2.38, + "learning_rate": 2.22920011071132e-05, + "loss": 0.1145, + "step": 24295 + }, + { + "epoch": 2.38, + "learning_rate": 2.2287849432604484e-05, + "loss": 0.1244, + "step": 24300 + }, + { + "epoch": 2.38, + "learning_rate": 2.228369775809577e-05, + "loss": 0.144, + "step": 24305 + }, + { + "epoch": 2.38, + "learning_rate": 2.227954608358705e-05, + "loss": 0.1149, + "step": 24310 + }, + { + "epoch": 2.38, + "learning_rate": 2.227539440907833e-05, + "loss": 0.1136, + "step": 24315 + }, + { + "epoch": 2.38, + "learning_rate": 2.227124273456961e-05, + "loss": 0.145, + "step": 24320 + }, + { + "epoch": 2.38, + "learning_rate": 2.226709106006089e-05, + "loss": 0.1396, + "step": 24325 + }, + { + "epoch": 2.38, + "learning_rate": 2.2262939385552172e-05, + "loss": 0.1329, + "step": 24330 + }, + { + "epoch": 2.38, + "learning_rate": 2.2258787711043453e-05, + "loss": 0.123, + "step": 24335 + }, + { + "epoch": 2.38, + "learning_rate": 2.2254636036534737e-05, + "loss": 0.139, + "step": 24340 + }, + { + "epoch": 2.38, + "learning_rate": 2.2250484362026018e-05, + "loss": 0.1046, + "step": 24345 + }, + { + "epoch": 2.38, + "learning_rate": 2.22463326875173e-05, + "loss": 0.1329, + "step": 24350 + }, + { + "epoch": 2.38, + "learning_rate": 2.2242181013008583e-05, + "loss": 0.1452, + "step": 24355 + }, + { + "epoch": 2.38, + "learning_rate": 2.2238029338499864e-05, + "loss": 0.1229, + "step": 24360 + }, + { + "epoch": 2.38, + "learning_rate": 2.2233877663991144e-05, + "loss": 0.1196, + "step": 24365 + }, + { + "epoch": 2.38, + "learning_rate": 2.2229725989482425e-05, + "loss": 0.1214, + "step": 24370 + }, + { + "epoch": 2.38, + "learning_rate": 2.2225574314973706e-05, + "loss": 0.1396, + "step": 24375 + }, + { + "epoch": 2.38, + "learning_rate": 2.2221422640464987e-05, + "loss": 0.123, + "step": 24380 + }, + { + "epoch": 2.38, + "learning_rate": 2.221727096595627e-05, + "loss": 0.113, + "step": 24385 + }, + { + "epoch": 2.38, + "learning_rate": 2.221311929144755e-05, + "loss": 0.1797, + "step": 24390 + }, + { + "epoch": 2.39, + "learning_rate": 2.2208967616938832e-05, + "loss": 0.1168, + "step": 24395 + }, + { + "epoch": 2.39, + "learning_rate": 2.2204815942430113e-05, + "loss": 0.1049, + "step": 24400 + }, + { + "epoch": 2.39, + "learning_rate": 2.2200664267921394e-05, + "loss": 0.1215, + "step": 24405 + }, + { + "epoch": 2.39, + "learning_rate": 2.2196512593412678e-05, + "loss": 0.1285, + "step": 24410 + }, + { + "epoch": 2.39, + "learning_rate": 2.219236091890396e-05, + "loss": 0.1013, + "step": 24415 + }, + { + "epoch": 2.39, + "learning_rate": 2.218820924439524e-05, + "loss": 0.1208, + "step": 24420 + }, + { + "epoch": 2.39, + "learning_rate": 2.218405756988652e-05, + "loss": 0.1314, + "step": 24425 + }, + { + "epoch": 2.39, + "learning_rate": 2.2179905895377805e-05, + "loss": 0.1135, + "step": 24430 + }, + { + "epoch": 2.39, + "learning_rate": 2.2175754220869085e-05, + "loss": 0.1241, + "step": 24435 + }, + { + "epoch": 2.39, + "learning_rate": 2.2171602546360366e-05, + "loss": 0.1496, + "step": 24440 + }, + { + "epoch": 2.39, + "learning_rate": 2.2167450871851647e-05, + "loss": 0.1212, + "step": 24445 + }, + { + "epoch": 2.39, + "learning_rate": 2.2163299197342928e-05, + "loss": 0.1279, + "step": 24450 + }, + { + "epoch": 2.39, + "learning_rate": 2.215914752283421e-05, + "loss": 0.1475, + "step": 24455 + }, + { + "epoch": 2.39, + "learning_rate": 2.2154995848325493e-05, + "loss": 0.1187, + "step": 24460 + }, + { + "epoch": 2.39, + "learning_rate": 2.2150844173816773e-05, + "loss": 0.1164, + "step": 24465 + }, + { + "epoch": 2.39, + "learning_rate": 2.2146692499308054e-05, + "loss": 0.1383, + "step": 24470 + }, + { + "epoch": 2.39, + "learning_rate": 2.2142540824799338e-05, + "loss": 0.1396, + "step": 24475 + }, + { + "epoch": 2.39, + "learning_rate": 2.213838915029062e-05, + "loss": 0.1177, + "step": 24480 + }, + { + "epoch": 2.39, + "learning_rate": 2.21342374757819e-05, + "loss": 0.1212, + "step": 24485 + }, + { + "epoch": 2.39, + "learning_rate": 2.213008580127318e-05, + "loss": 0.1538, + "step": 24490 + }, + { + "epoch": 2.4, + "learning_rate": 2.212593412676446e-05, + "loss": 0.1299, + "step": 24495 + }, + { + "epoch": 2.4, + "learning_rate": 2.2121782452255742e-05, + "loss": 0.1009, + "step": 24500 + }, + { + "epoch": 2.4, + "eval_cer": 0.06267703499194166, + "eval_loss": 0.2565563917160034, + "eval_runtime": 277.9762, + "eval_samples_per_second": 58.89, + "eval_steps_per_second": 1.637, + "eval_wer": 0.1600138432706686, + "step": 24500 + }, + { + "epoch": 2.4, + "learning_rate": 2.2117630777747023e-05, + "loss": 0.1407, + "step": 24505 + }, + { + "epoch": 2.4, + "learning_rate": 2.2113479103238307e-05, + "loss": 0.1185, + "step": 24510 + }, + { + "epoch": 2.4, + "learning_rate": 2.2109327428729588e-05, + "loss": 0.1232, + "step": 24515 + }, + { + "epoch": 2.4, + "learning_rate": 2.2105175754220872e-05, + "loss": 0.1261, + "step": 24520 + }, + { + "epoch": 2.4, + "learning_rate": 2.2101024079712153e-05, + "loss": 0.1308, + "step": 24525 + }, + { + "epoch": 2.4, + "learning_rate": 2.2096872405203433e-05, + "loss": 0.1335, + "step": 24530 + }, + { + "epoch": 2.4, + "learning_rate": 2.2092720730694714e-05, + "loss": 0.1359, + "step": 24535 + }, + { + "epoch": 2.4, + "learning_rate": 2.2088569056185995e-05, + "loss": 0.1332, + "step": 24540 + }, + { + "epoch": 2.4, + "learning_rate": 2.2084417381677276e-05, + "loss": 0.1221, + "step": 24545 + }, + { + "epoch": 2.4, + "learning_rate": 2.2080265707168557e-05, + "loss": 0.1112, + "step": 24550 + }, + { + "epoch": 2.4, + "learning_rate": 2.2076114032659837e-05, + "loss": 0.1525, + "step": 24555 + }, + { + "epoch": 2.4, + "learning_rate": 2.207196235815112e-05, + "loss": 0.1231, + "step": 24560 + }, + { + "epoch": 2.4, + "learning_rate": 2.2067810683642406e-05, + "loss": 0.1277, + "step": 24565 + }, + { + "epoch": 2.4, + "learning_rate": 2.2063659009133686e-05, + "loss": 0.1263, + "step": 24570 + }, + { + "epoch": 2.4, + "learning_rate": 2.2059507334624967e-05, + "loss": 0.1202, + "step": 24575 + }, + { + "epoch": 2.4, + "learning_rate": 2.2055355660116248e-05, + "loss": 0.1086, + "step": 24580 + }, + { + "epoch": 2.4, + "learning_rate": 2.205120398560753e-05, + "loss": 0.1187, + "step": 24585 + }, + { + "epoch": 2.4, + "learning_rate": 2.204705231109881e-05, + "loss": 0.159, + "step": 24590 + }, + { + "epoch": 2.4, + "learning_rate": 2.204290063659009e-05, + "loss": 0.1287, + "step": 24595 + }, + { + "epoch": 2.41, + "learning_rate": 2.203874896208137e-05, + "loss": 0.1264, + "step": 24600 + }, + { + "epoch": 2.41, + "learning_rate": 2.2034597287572655e-05, + "loss": 0.165, + "step": 24605 + }, + { + "epoch": 2.41, + "learning_rate": 2.2030445613063936e-05, + "loss": 0.1212, + "step": 24610 + }, + { + "epoch": 2.41, + "learning_rate": 2.202629393855522e-05, + "loss": 0.1082, + "step": 24615 + }, + { + "epoch": 2.41, + "learning_rate": 2.20221422640465e-05, + "loss": 0.1066, + "step": 24620 + }, + { + "epoch": 2.41, + "learning_rate": 2.201799058953778e-05, + "loss": 0.1265, + "step": 24625 + }, + { + "epoch": 2.41, + "learning_rate": 2.2013838915029062e-05, + "loss": 0.11, + "step": 24630 + }, + { + "epoch": 2.41, + "learning_rate": 2.2009687240520343e-05, + "loss": 0.1165, + "step": 24635 + }, + { + "epoch": 2.41, + "learning_rate": 2.2005535566011624e-05, + "loss": 0.1346, + "step": 24640 + }, + { + "epoch": 2.41, + "learning_rate": 2.2001383891502905e-05, + "loss": 0.1159, + "step": 24645 + }, + { + "epoch": 2.41, + "learning_rate": 2.199723221699419e-05, + "loss": 0.1025, + "step": 24650 + }, + { + "epoch": 2.41, + "learning_rate": 2.199308054248547e-05, + "loss": 0.1245, + "step": 24655 + }, + { + "epoch": 2.41, + "learning_rate": 2.198892886797675e-05, + "loss": 0.1233, + "step": 24660 + }, + { + "epoch": 2.41, + "learning_rate": 2.1984777193468035e-05, + "loss": 0.1107, + "step": 24665 + }, + { + "epoch": 2.41, + "learning_rate": 2.1980625518959315e-05, + "loss": 0.152, + "step": 24670 + }, + { + "epoch": 2.41, + "learning_rate": 2.1976473844450596e-05, + "loss": 0.1334, + "step": 24675 + }, + { + "epoch": 2.41, + "learning_rate": 2.1972322169941877e-05, + "loss": 0.1134, + "step": 24680 + }, + { + "epoch": 2.41, + "learning_rate": 2.1968170495433158e-05, + "loss": 0.111, + "step": 24685 + }, + { + "epoch": 2.41, + "learning_rate": 2.196401882092444e-05, + "loss": 0.1471, + "step": 24690 + }, + { + "epoch": 2.41, + "learning_rate": 2.1959867146415723e-05, + "loss": 0.1202, + "step": 24695 + }, + { + "epoch": 2.42, + "learning_rate": 2.1955715471907003e-05, + "loss": 0.1093, + "step": 24700 + }, + { + "epoch": 2.42, + "learning_rate": 2.1951563797398284e-05, + "loss": 0.1457, + "step": 24705 + }, + { + "epoch": 2.42, + "learning_rate": 2.1947412122889565e-05, + "loss": 0.1154, + "step": 24710 + }, + { + "epoch": 2.42, + "learning_rate": 2.194326044838085e-05, + "loss": 0.1138, + "step": 24715 + }, + { + "epoch": 2.42, + "learning_rate": 2.193910877387213e-05, + "loss": 0.1178, + "step": 24720 + }, + { + "epoch": 2.42, + "learning_rate": 2.193495709936341e-05, + "loss": 0.1257, + "step": 24725 + }, + { + "epoch": 2.42, + "learning_rate": 2.193080542485469e-05, + "loss": 0.1198, + "step": 24730 + }, + { + "epoch": 2.42, + "learning_rate": 2.1926653750345972e-05, + "loss": 0.1263, + "step": 24735 + }, + { + "epoch": 2.42, + "learning_rate": 2.1922502075837256e-05, + "loss": 0.1682, + "step": 24740 + }, + { + "epoch": 2.42, + "learning_rate": 2.1918350401328537e-05, + "loss": 0.1196, + "step": 24745 + }, + { + "epoch": 2.42, + "learning_rate": 2.1914198726819818e-05, + "loss": 0.1158, + "step": 24750 + }, + { + "epoch": 2.42, + "learning_rate": 2.19100470523111e-05, + "loss": 0.1271, + "step": 24755 + }, + { + "epoch": 2.42, + "learning_rate": 2.190589537780238e-05, + "loss": 0.1234, + "step": 24760 + }, + { + "epoch": 2.42, + "learning_rate": 2.1901743703293663e-05, + "loss": 0.1095, + "step": 24765 + }, + { + "epoch": 2.42, + "learning_rate": 2.1897592028784944e-05, + "loss": 0.1464, + "step": 24770 + }, + { + "epoch": 2.42, + "learning_rate": 2.1893440354276225e-05, + "loss": 0.1398, + "step": 24775 + }, + { + "epoch": 2.42, + "learning_rate": 2.1889288679767506e-05, + "loss": 0.1154, + "step": 24780 + }, + { + "epoch": 2.42, + "learning_rate": 2.188513700525879e-05, + "loss": 0.1245, + "step": 24785 + }, + { + "epoch": 2.42, + "learning_rate": 2.188098533075007e-05, + "loss": 0.1474, + "step": 24790 + }, + { + "epoch": 2.42, + "learning_rate": 2.187683365624135e-05, + "loss": 0.1239, + "step": 24795 + }, + { + "epoch": 2.43, + "learning_rate": 2.1872681981732632e-05, + "loss": 0.1198, + "step": 24800 + }, + { + "epoch": 2.43, + "learning_rate": 2.1868530307223913e-05, + "loss": 0.1434, + "step": 24805 + }, + { + "epoch": 2.43, + "learning_rate": 2.1864378632715194e-05, + "loss": 0.1284, + "step": 24810 + }, + { + "epoch": 2.43, + "learning_rate": 2.1860226958206475e-05, + "loss": 0.0984, + "step": 24815 + }, + { + "epoch": 2.43, + "learning_rate": 2.185607528369776e-05, + "loss": 0.1489, + "step": 24820 + }, + { + "epoch": 2.43, + "learning_rate": 2.1851923609189043e-05, + "loss": 0.1249, + "step": 24825 + }, + { + "epoch": 2.43, + "learning_rate": 2.1847771934680324e-05, + "loss": 0.1148, + "step": 24830 + }, + { + "epoch": 2.43, + "learning_rate": 2.1843620260171604e-05, + "loss": 0.1277, + "step": 24835 + }, + { + "epoch": 2.43, + "learning_rate": 2.1839468585662885e-05, + "loss": 0.1454, + "step": 24840 + }, + { + "epoch": 2.43, + "learning_rate": 2.1835316911154166e-05, + "loss": 0.104, + "step": 24845 + }, + { + "epoch": 2.43, + "learning_rate": 2.1831165236645447e-05, + "loss": 0.1119, + "step": 24850 + }, + { + "epoch": 2.43, + "learning_rate": 2.1827013562136727e-05, + "loss": 0.1442, + "step": 24855 + }, + { + "epoch": 2.43, + "learning_rate": 2.1822861887628008e-05, + "loss": 0.1129, + "step": 24860 + }, + { + "epoch": 2.43, + "learning_rate": 2.181871021311929e-05, + "loss": 0.1271, + "step": 24865 + }, + { + "epoch": 2.43, + "learning_rate": 2.1814558538610577e-05, + "loss": 0.112, + "step": 24870 + }, + { + "epoch": 2.43, + "learning_rate": 2.1810406864101857e-05, + "loss": 0.1412, + "step": 24875 + }, + { + "epoch": 2.43, + "learning_rate": 2.1806255189593138e-05, + "loss": 0.115, + "step": 24880 + }, + { + "epoch": 2.43, + "learning_rate": 2.180210351508442e-05, + "loss": 0.1198, + "step": 24885 + }, + { + "epoch": 2.43, + "learning_rate": 2.17979518405757e-05, + "loss": 0.1394, + "step": 24890 + }, + { + "epoch": 2.43, + "learning_rate": 2.179380016606698e-05, + "loss": 0.1182, + "step": 24895 + }, + { + "epoch": 2.43, + "learning_rate": 2.178964849155826e-05, + "loss": 0.1236, + "step": 24900 + }, + { + "epoch": 2.44, + "learning_rate": 2.1785496817049542e-05, + "loss": 0.1443, + "step": 24905 + }, + { + "epoch": 2.44, + "learning_rate": 2.1781345142540823e-05, + "loss": 0.1265, + "step": 24910 + }, + { + "epoch": 2.44, + "learning_rate": 2.1777193468032107e-05, + "loss": 0.1198, + "step": 24915 + }, + { + "epoch": 2.44, + "learning_rate": 2.177304179352339e-05, + "loss": 0.126, + "step": 24920 + }, + { + "epoch": 2.44, + "learning_rate": 2.1768890119014672e-05, + "loss": 0.1192, + "step": 24925 + }, + { + "epoch": 2.44, + "learning_rate": 2.1764738444505953e-05, + "loss": 0.1011, + "step": 24930 + }, + { + "epoch": 2.44, + "learning_rate": 2.1760586769997233e-05, + "loss": 0.1271, + "step": 24935 + }, + { + "epoch": 2.44, + "learning_rate": 2.1756435095488514e-05, + "loss": 0.1376, + "step": 24940 + }, + { + "epoch": 2.44, + "learning_rate": 2.1752283420979795e-05, + "loss": 0.1064, + "step": 24945 + }, + { + "epoch": 2.44, + "learning_rate": 2.1748131746471076e-05, + "loss": 0.1035, + "step": 24950 + }, + { + "epoch": 2.44, + "learning_rate": 2.1743980071962356e-05, + "loss": 0.1507, + "step": 24955 + }, + { + "epoch": 2.44, + "learning_rate": 2.173982839745364e-05, + "loss": 0.1188, + "step": 24960 + }, + { + "epoch": 2.44, + "learning_rate": 2.173567672294492e-05, + "loss": 0.1036, + "step": 24965 + }, + { + "epoch": 2.44, + "learning_rate": 2.1731525048436205e-05, + "loss": 0.1215, + "step": 24970 + }, + { + "epoch": 2.44, + "learning_rate": 2.1727373373927486e-05, + "loss": 0.1402, + "step": 24975 + }, + { + "epoch": 2.44, + "learning_rate": 2.1723221699418767e-05, + "loss": 0.1241, + "step": 24980 + }, + { + "epoch": 2.44, + "learning_rate": 2.1719070024910048e-05, + "loss": 0.1095, + "step": 24985 + }, + { + "epoch": 2.44, + "learning_rate": 2.171491835040133e-05, + "loss": 0.1444, + "step": 24990 + }, + { + "epoch": 2.44, + "learning_rate": 2.171076667589261e-05, + "loss": 0.1174, + "step": 24995 + }, + { + "epoch": 2.44, + "learning_rate": 2.170661500138389e-05, + "loss": 0.1133, + "step": 25000 + }, + { + "epoch": 2.44, + "eval_cer": 0.06142955250178625, + "eval_loss": 0.25334686040878296, + "eval_runtime": 273.914, + "eval_samples_per_second": 59.763, + "eval_steps_per_second": 1.661, + "eval_wer": 0.15655955544817587, + "step": 25000 + }, + { + "epoch": 2.45, + "learning_rate": 2.1702463326875174e-05, + "loss": 0.1216, + "step": 25005 + }, + { + "epoch": 2.45, + "learning_rate": 2.1698311652366455e-05, + "loss": 0.142, + "step": 25010 + }, + { + "epoch": 2.45, + "learning_rate": 2.1694159977857736e-05, + "loss": 0.1066, + "step": 25015 + }, + { + "epoch": 2.45, + "learning_rate": 2.1690008303349017e-05, + "loss": 0.1059, + "step": 25020 + }, + { + "epoch": 2.45, + "learning_rate": 2.16858566288403e-05, + "loss": 0.1376, + "step": 25025 + }, + { + "epoch": 2.45, + "learning_rate": 2.168170495433158e-05, + "loss": 0.1174, + "step": 25030 + }, + { + "epoch": 2.45, + "learning_rate": 2.1677553279822862e-05, + "loss": 0.1202, + "step": 25035 + }, + { + "epoch": 2.45, + "learning_rate": 2.1673401605314143e-05, + "loss": 0.1577, + "step": 25040 + }, + { + "epoch": 2.45, + "learning_rate": 2.1669249930805427e-05, + "loss": 0.1234, + "step": 25045 + }, + { + "epoch": 2.45, + "learning_rate": 2.1665098256296708e-05, + "loss": 0.1101, + "step": 25050 + }, + { + "epoch": 2.45, + "learning_rate": 2.166094658178799e-05, + "loss": 0.1395, + "step": 25055 + }, + { + "epoch": 2.45, + "learning_rate": 2.165679490727927e-05, + "loss": 0.1132, + "step": 25060 + }, + { + "epoch": 2.45, + "learning_rate": 2.165264323277055e-05, + "loss": 0.1181, + "step": 25065 + }, + { + "epoch": 2.45, + "learning_rate": 2.164849155826183e-05, + "loss": 0.1225, + "step": 25070 + }, + { + "epoch": 2.45, + "learning_rate": 2.1644339883753115e-05, + "loss": 0.1447, + "step": 25075 + }, + { + "epoch": 2.45, + "learning_rate": 2.1640188209244396e-05, + "loss": 0.1225, + "step": 25080 + }, + { + "epoch": 2.45, + "learning_rate": 2.1636036534735677e-05, + "loss": 0.1158, + "step": 25085 + }, + { + "epoch": 2.45, + "learning_rate": 2.163188486022696e-05, + "loss": 0.1594, + "step": 25090 + }, + { + "epoch": 2.45, + "learning_rate": 2.162773318571824e-05, + "loss": 0.1241, + "step": 25095 + }, + { + "epoch": 2.45, + "learning_rate": 2.1623581511209522e-05, + "loss": 0.1159, + "step": 25100 + }, + { + "epoch": 2.45, + "learning_rate": 2.1619429836700803e-05, + "loss": 0.135, + "step": 25105 + }, + { + "epoch": 2.46, + "learning_rate": 2.1615278162192084e-05, + "loss": 0.1209, + "step": 25110 + }, + { + "epoch": 2.46, + "learning_rate": 2.1611126487683365e-05, + "loss": 0.1135, + "step": 25115 + }, + { + "epoch": 2.46, + "learning_rate": 2.1606974813174645e-05, + "loss": 0.1496, + "step": 25120 + }, + { + "epoch": 2.46, + "learning_rate": 2.160282313866593e-05, + "loss": 0.1331, + "step": 25125 + }, + { + "epoch": 2.46, + "learning_rate": 2.159867146415721e-05, + "loss": 0.1053, + "step": 25130 + }, + { + "epoch": 2.46, + "learning_rate": 2.1594519789648495e-05, + "loss": 0.1321, + "step": 25135 + }, + { + "epoch": 2.46, + "learning_rate": 2.1590368115139775e-05, + "loss": 0.1395, + "step": 25140 + }, + { + "epoch": 2.46, + "learning_rate": 2.1586216440631056e-05, + "loss": 0.1067, + "step": 25145 + }, + { + "epoch": 2.46, + "learning_rate": 2.1582064766122337e-05, + "loss": 0.1186, + "step": 25150 + }, + { + "epoch": 2.46, + "learning_rate": 2.1577913091613618e-05, + "loss": 0.1472, + "step": 25155 + }, + { + "epoch": 2.46, + "learning_rate": 2.15737614171049e-05, + "loss": 0.1304, + "step": 25160 + }, + { + "epoch": 2.46, + "learning_rate": 2.156960974259618e-05, + "loss": 0.1223, + "step": 25165 + }, + { + "epoch": 2.46, + "learning_rate": 2.156545806808746e-05, + "loss": 0.1379, + "step": 25170 + }, + { + "epoch": 2.46, + "learning_rate": 2.1561306393578744e-05, + "loss": 0.1395, + "step": 25175 + }, + { + "epoch": 2.46, + "learning_rate": 2.1557154719070028e-05, + "loss": 0.1272, + "step": 25180 + }, + { + "epoch": 2.46, + "learning_rate": 2.155300304456131e-05, + "loss": 0.1288, + "step": 25185 + }, + { + "epoch": 2.46, + "learning_rate": 2.154885137005259e-05, + "loss": 0.1438, + "step": 25190 + }, + { + "epoch": 2.46, + "learning_rate": 2.154469969554387e-05, + "loss": 0.1266, + "step": 25195 + }, + { + "epoch": 2.46, + "learning_rate": 2.154054802103515e-05, + "loss": 0.1236, + "step": 25200 + }, + { + "epoch": 2.46, + "learning_rate": 2.1536396346526432e-05, + "loss": 0.1215, + "step": 25205 + }, + { + "epoch": 2.47, + "learning_rate": 2.1532244672017713e-05, + "loss": 0.1303, + "step": 25210 + }, + { + "epoch": 2.47, + "learning_rate": 2.1528092997508994e-05, + "loss": 0.1153, + "step": 25215 + }, + { + "epoch": 2.47, + "learning_rate": 2.1523941323000274e-05, + "loss": 0.1272, + "step": 25220 + }, + { + "epoch": 2.47, + "learning_rate": 2.151978964849156e-05, + "loss": 0.1436, + "step": 25225 + }, + { + "epoch": 2.47, + "learning_rate": 2.1515637973982843e-05, + "loss": 0.133, + "step": 25230 + }, + { + "epoch": 2.47, + "learning_rate": 2.1511486299474123e-05, + "loss": 0.1262, + "step": 25235 + }, + { + "epoch": 2.47, + "learning_rate": 2.1507334624965404e-05, + "loss": 0.1625, + "step": 25240 + }, + { + "epoch": 2.47, + "learning_rate": 2.1503182950456685e-05, + "loss": 0.13, + "step": 25245 + }, + { + "epoch": 2.47, + "learning_rate": 2.1499031275947966e-05, + "loss": 0.1156, + "step": 25250 + }, + { + "epoch": 2.47, + "learning_rate": 2.1494879601439247e-05, + "loss": 0.1352, + "step": 25255 + }, + { + "epoch": 2.47, + "learning_rate": 2.1490727926930527e-05, + "loss": 0.1143, + "step": 25260 + }, + { + "epoch": 2.47, + "learning_rate": 2.148657625242181e-05, + "loss": 0.117, + "step": 25265 + }, + { + "epoch": 2.47, + "learning_rate": 2.1482424577913092e-05, + "loss": 0.1129, + "step": 25270 + }, + { + "epoch": 2.47, + "learning_rate": 2.1478272903404373e-05, + "loss": 0.1279, + "step": 25275 + }, + { + "epoch": 2.47, + "learning_rate": 2.1474121228895657e-05, + "loss": 0.1142, + "step": 25280 + }, + { + "epoch": 2.47, + "learning_rate": 2.1469969554386938e-05, + "loss": 0.1151, + "step": 25285 + }, + { + "epoch": 2.47, + "learning_rate": 2.146581787987822e-05, + "loss": 0.14, + "step": 25290 + }, + { + "epoch": 2.47, + "learning_rate": 2.14616662053695e-05, + "loss": 0.1254, + "step": 25295 + }, + { + "epoch": 2.47, + "learning_rate": 2.145751453086078e-05, + "loss": 0.1337, + "step": 25300 + }, + { + "epoch": 2.47, + "learning_rate": 2.145336285635206e-05, + "loss": 0.1408, + "step": 25305 + }, + { + "epoch": 2.47, + "learning_rate": 2.1449211181843345e-05, + "loss": 0.1248, + "step": 25310 + }, + { + "epoch": 2.48, + "learning_rate": 2.1445059507334626e-05, + "loss": 0.1175, + "step": 25315 + }, + { + "epoch": 2.48, + "learning_rate": 2.1440907832825907e-05, + "loss": 0.1412, + "step": 25320 + }, + { + "epoch": 2.48, + "learning_rate": 2.1436756158317187e-05, + "loss": 0.1354, + "step": 25325 + }, + { + "epoch": 2.48, + "learning_rate": 2.143260448380847e-05, + "loss": 0.1169, + "step": 25330 + }, + { + "epoch": 2.48, + "learning_rate": 2.1428452809299752e-05, + "loss": 0.1184, + "step": 25335 + }, + { + "epoch": 2.48, + "learning_rate": 2.1424301134791033e-05, + "loss": 0.1499, + "step": 25340 + }, + { + "epoch": 2.48, + "learning_rate": 2.1420149460282314e-05, + "loss": 0.1178, + "step": 25345 + }, + { + "epoch": 2.48, + "learning_rate": 2.1415997785773595e-05, + "loss": 0.1112, + "step": 25350 + }, + { + "epoch": 2.48, + "learning_rate": 2.141184611126488e-05, + "loss": 0.1455, + "step": 25355 + }, + { + "epoch": 2.48, + "learning_rate": 2.140769443675616e-05, + "loss": 0.1302, + "step": 25360 + }, + { + "epoch": 2.48, + "learning_rate": 2.140354276224744e-05, + "loss": 0.1214, + "step": 25365 + }, + { + "epoch": 2.48, + "learning_rate": 2.139939108773872e-05, + "loss": 0.1308, + "step": 25370 + }, + { + "epoch": 2.48, + "learning_rate": 2.1395239413230002e-05, + "loss": 0.14, + "step": 25375 + }, + { + "epoch": 2.48, + "learning_rate": 2.1391087738721286e-05, + "loss": 0.1208, + "step": 25380 + }, + { + "epoch": 2.48, + "learning_rate": 2.1386936064212567e-05, + "loss": 0.1051, + "step": 25385 + }, + { + "epoch": 2.48, + "learning_rate": 2.1382784389703848e-05, + "loss": 0.1678, + "step": 25390 + }, + { + "epoch": 2.48, + "learning_rate": 2.137863271519513e-05, + "loss": 0.1254, + "step": 25395 + }, + { + "epoch": 2.48, + "learning_rate": 2.1374481040686413e-05, + "loss": 0.1128, + "step": 25400 + }, + { + "epoch": 2.48, + "learning_rate": 2.1370329366177693e-05, + "loss": 0.1377, + "step": 25405 + }, + { + "epoch": 2.48, + "learning_rate": 2.1366177691668974e-05, + "loss": 0.1335, + "step": 25410 + }, + { + "epoch": 2.49, + "learning_rate": 2.1362026017160255e-05, + "loss": 0.1241, + "step": 25415 + }, + { + "epoch": 2.49, + "learning_rate": 2.1357874342651536e-05, + "loss": 0.1236, + "step": 25420 + }, + { + "epoch": 2.49, + "learning_rate": 2.1353722668142816e-05, + "loss": 0.1412, + "step": 25425 + }, + { + "epoch": 2.49, + "learning_rate": 2.1349570993634097e-05, + "loss": 0.1109, + "step": 25430 + }, + { + "epoch": 2.49, + "learning_rate": 2.134541931912538e-05, + "loss": 0.1187, + "step": 25435 + }, + { + "epoch": 2.49, + "learning_rate": 2.1341267644616662e-05, + "loss": 0.1509, + "step": 25440 + }, + { + "epoch": 2.49, + "learning_rate": 2.1337115970107946e-05, + "loss": 0.1102, + "step": 25445 + }, + { + "epoch": 2.49, + "learning_rate": 2.1332964295599227e-05, + "loss": 0.1113, + "step": 25450 + }, + { + "epoch": 2.49, + "learning_rate": 2.1328812621090508e-05, + "loss": 0.1342, + "step": 25455 + }, + { + "epoch": 2.49, + "learning_rate": 2.132466094658179e-05, + "loss": 0.1243, + "step": 25460 + }, + { + "epoch": 2.49, + "learning_rate": 2.132050927207307e-05, + "loss": 0.1073, + "step": 25465 + }, + { + "epoch": 2.49, + "learning_rate": 2.131635759756435e-05, + "loss": 0.1295, + "step": 25470 + }, + { + "epoch": 2.49, + "learning_rate": 2.131220592305563e-05, + "loss": 0.1325, + "step": 25475 + }, + { + "epoch": 2.49, + "learning_rate": 2.130805424854691e-05, + "loss": 0.1004, + "step": 25480 + }, + { + "epoch": 2.49, + "learning_rate": 2.1303902574038196e-05, + "loss": 0.13, + "step": 25485 + }, + { + "epoch": 2.49, + "learning_rate": 2.129975089952948e-05, + "loss": 0.164, + "step": 25490 + }, + { + "epoch": 2.49, + "learning_rate": 2.129559922502076e-05, + "loss": 0.1347, + "step": 25495 + }, + { + "epoch": 2.49, + "learning_rate": 2.129144755051204e-05, + "loss": 0.1135, + "step": 25500 + }, + { + "epoch": 2.49, + "eval_cer": 0.06055319316208486, + "eval_loss": 0.24695424735546112, + "eval_runtime": 278.0489, + "eval_samples_per_second": 58.875, + "eval_steps_per_second": 1.636, + "eval_wer": 0.15605675740974123, + "step": 25500 + }, + { + "epoch": 2.49, + "learning_rate": 2.1287295876003322e-05, + "loss": 0.1524, + "step": 25505 + }, + { + "epoch": 2.49, + "learning_rate": 2.1283144201494603e-05, + "loss": 0.117, + "step": 25510 + }, + { + "epoch": 2.49, + "learning_rate": 2.1278992526985884e-05, + "loss": 0.1163, + "step": 25515 + }, + { + "epoch": 2.5, + "learning_rate": 2.1274840852477165e-05, + "loss": 0.1349, + "step": 25520 + }, + { + "epoch": 2.5, + "learning_rate": 2.1270689177968445e-05, + "loss": 0.1359, + "step": 25525 + }, + { + "epoch": 2.5, + "learning_rate": 2.126653750345973e-05, + "loss": 0.1181, + "step": 25530 + }, + { + "epoch": 2.5, + "learning_rate": 2.1262385828951014e-05, + "loss": 0.1212, + "step": 25535 + }, + { + "epoch": 2.5, + "learning_rate": 2.1258234154442294e-05, + "loss": 0.1343, + "step": 25540 + }, + { + "epoch": 2.5, + "learning_rate": 2.1254082479933575e-05, + "loss": 0.1119, + "step": 25545 + }, + { + "epoch": 2.5, + "learning_rate": 2.1249930805424856e-05, + "loss": 0.1144, + "step": 25550 + }, + { + "epoch": 2.5, + "learning_rate": 2.1245779130916137e-05, + "loss": 0.1343, + "step": 25555 + }, + { + "epoch": 2.5, + "learning_rate": 2.1241627456407417e-05, + "loss": 0.1307, + "step": 25560 + }, + { + "epoch": 2.5, + "learning_rate": 2.1237475781898698e-05, + "loss": 0.1094, + "step": 25565 + }, + { + "epoch": 2.5, + "learning_rate": 2.123332410738998e-05, + "loss": 0.1174, + "step": 25570 + }, + { + "epoch": 2.5, + "learning_rate": 2.1229172432881263e-05, + "loss": 0.1211, + "step": 25575 + }, + { + "epoch": 2.5, + "learning_rate": 2.1225020758372544e-05, + "loss": 0.1132, + "step": 25580 + }, + { + "epoch": 2.5, + "learning_rate": 2.1220869083863828e-05, + "loss": 0.1219, + "step": 25585 + }, + { + "epoch": 2.5, + "learning_rate": 2.121671740935511e-05, + "loss": 0.1314, + "step": 25590 + }, + { + "epoch": 2.5, + "learning_rate": 2.121256573484639e-05, + "loss": 0.1139, + "step": 25595 + }, + { + "epoch": 2.5, + "learning_rate": 2.120841406033767e-05, + "loss": 0.1161, + "step": 25600 + }, + { + "epoch": 2.5, + "learning_rate": 2.120426238582895e-05, + "loss": 0.1523, + "step": 25605 + }, + { + "epoch": 2.5, + "learning_rate": 2.1200110711320232e-05, + "loss": 0.1191, + "step": 25610 + }, + { + "epoch": 2.5, + "learning_rate": 2.1195959036811513e-05, + "loss": 0.1214, + "step": 25615 + }, + { + "epoch": 2.51, + "learning_rate": 2.1191807362302797e-05, + "loss": 0.125, + "step": 25620 + }, + { + "epoch": 2.51, + "learning_rate": 2.1187655687794078e-05, + "loss": 0.125, + "step": 25625 + }, + { + "epoch": 2.51, + "learning_rate": 2.118350401328536e-05, + "loss": 0.1073, + "step": 25630 + }, + { + "epoch": 2.51, + "learning_rate": 2.117935233877664e-05, + "loss": 0.1149, + "step": 25635 + }, + { + "epoch": 2.51, + "learning_rate": 2.1175200664267923e-05, + "loss": 0.1287, + "step": 25640 + }, + { + "epoch": 2.51, + "learning_rate": 2.1171048989759204e-05, + "loss": 0.1087, + "step": 25645 + }, + { + "epoch": 2.51, + "learning_rate": 2.1166897315250485e-05, + "loss": 0.1149, + "step": 25650 + }, + { + "epoch": 2.51, + "learning_rate": 2.1162745640741766e-05, + "loss": 0.1153, + "step": 25655 + }, + { + "epoch": 2.51, + "learning_rate": 2.1158593966233046e-05, + "loss": 0.1256, + "step": 25660 + }, + { + "epoch": 2.51, + "learning_rate": 2.115444229172433e-05, + "loss": 0.1365, + "step": 25665 + }, + { + "epoch": 2.51, + "learning_rate": 2.115029061721561e-05, + "loss": 0.1025, + "step": 25670 + }, + { + "epoch": 2.51, + "learning_rate": 2.1146138942706892e-05, + "loss": 0.1314, + "step": 25675 + }, + { + "epoch": 2.51, + "learning_rate": 2.1141987268198173e-05, + "loss": 0.1101, + "step": 25680 + }, + { + "epoch": 2.51, + "learning_rate": 2.1137835593689454e-05, + "loss": 0.1184, + "step": 25685 + }, + { + "epoch": 2.51, + "learning_rate": 2.1133683919180738e-05, + "loss": 0.1608, + "step": 25690 + }, + { + "epoch": 2.51, + "learning_rate": 2.112953224467202e-05, + "loss": 0.1222, + "step": 25695 + }, + { + "epoch": 2.51, + "learning_rate": 2.11253805701633e-05, + "loss": 0.13, + "step": 25700 + }, + { + "epoch": 2.51, + "learning_rate": 2.112122889565458e-05, + "loss": 0.1478, + "step": 25705 + }, + { + "epoch": 2.51, + "learning_rate": 2.1117077221145864e-05, + "loss": 0.1215, + "step": 25710 + }, + { + "epoch": 2.51, + "learning_rate": 2.1112925546637145e-05, + "loss": 0.1306, + "step": 25715 + }, + { + "epoch": 2.51, + "learning_rate": 2.1108773872128426e-05, + "loss": 0.1249, + "step": 25720 + }, + { + "epoch": 2.52, + "learning_rate": 2.1104622197619707e-05, + "loss": 0.1522, + "step": 25725 + }, + { + "epoch": 2.52, + "learning_rate": 2.1100470523110987e-05, + "loss": 0.1097, + "step": 25730 + }, + { + "epoch": 2.52, + "learning_rate": 2.1096318848602268e-05, + "loss": 0.1015, + "step": 25735 + }, + { + "epoch": 2.52, + "learning_rate": 2.1092167174093552e-05, + "loss": 0.133, + "step": 25740 + }, + { + "epoch": 2.52, + "learning_rate": 2.1088015499584833e-05, + "loss": 0.1307, + "step": 25745 + }, + { + "epoch": 2.52, + "learning_rate": 2.1083863825076117e-05, + "loss": 0.1185, + "step": 25750 + }, + { + "epoch": 2.52, + "learning_rate": 2.1079712150567398e-05, + "loss": 0.1603, + "step": 25755 + }, + { + "epoch": 2.52, + "learning_rate": 2.107556047605868e-05, + "loss": 0.1228, + "step": 25760 + }, + { + "epoch": 2.52, + "learning_rate": 2.107140880154996e-05, + "loss": 0.1125, + "step": 25765 + }, + { + "epoch": 2.52, + "learning_rate": 2.106725712704124e-05, + "loss": 0.1173, + "step": 25770 + }, + { + "epoch": 2.52, + "learning_rate": 2.106310545253252e-05, + "loss": 0.1286, + "step": 25775 + }, + { + "epoch": 2.52, + "learning_rate": 2.1058953778023802e-05, + "loss": 0.1226, + "step": 25780 + }, + { + "epoch": 2.52, + "learning_rate": 2.1054802103515083e-05, + "loss": 0.1202, + "step": 25785 + }, + { + "epoch": 2.52, + "learning_rate": 2.1050650429006367e-05, + "loss": 0.1477, + "step": 25790 + }, + { + "epoch": 2.52, + "learning_rate": 2.104649875449765e-05, + "loss": 0.1317, + "step": 25795 + }, + { + "epoch": 2.52, + "learning_rate": 2.104234707998893e-05, + "loss": 0.1245, + "step": 25800 + }, + { + "epoch": 2.52, + "learning_rate": 2.1038195405480212e-05, + "loss": 0.1449, + "step": 25805 + }, + { + "epoch": 2.52, + "learning_rate": 2.1034043730971493e-05, + "loss": 0.1204, + "step": 25810 + }, + { + "epoch": 2.52, + "learning_rate": 2.1029892056462774e-05, + "loss": 0.1107, + "step": 25815 + }, + { + "epoch": 2.52, + "learning_rate": 2.1025740381954055e-05, + "loss": 0.1239, + "step": 25820 + }, + { + "epoch": 2.53, + "learning_rate": 2.1021588707445335e-05, + "loss": 0.133, + "step": 25825 + }, + { + "epoch": 2.53, + "learning_rate": 2.1017437032936616e-05, + "loss": 0.1217, + "step": 25830 + }, + { + "epoch": 2.53, + "learning_rate": 2.1013285358427897e-05, + "loss": 0.1181, + "step": 25835 + }, + { + "epoch": 2.53, + "learning_rate": 2.100913368391918e-05, + "loss": 0.1225, + "step": 25840 + }, + { + "epoch": 2.53, + "learning_rate": 2.1004982009410465e-05, + "loss": 0.1193, + "step": 25845 + }, + { + "epoch": 2.53, + "learning_rate": 2.1000830334901746e-05, + "loss": 0.1186, + "step": 25850 + }, + { + "epoch": 2.53, + "learning_rate": 2.0996678660393027e-05, + "loss": 0.1397, + "step": 25855 + }, + { + "epoch": 2.53, + "learning_rate": 2.0992526985884308e-05, + "loss": 0.1249, + "step": 25860 + }, + { + "epoch": 2.53, + "learning_rate": 2.098837531137559e-05, + "loss": 0.1055, + "step": 25865 + }, + { + "epoch": 2.53, + "learning_rate": 2.098422363686687e-05, + "loss": 0.1199, + "step": 25870 + }, + { + "epoch": 2.53, + "learning_rate": 2.098007196235815e-05, + "loss": 0.1394, + "step": 25875 + }, + { + "epoch": 2.53, + "learning_rate": 2.097592028784943e-05, + "loss": 0.117, + "step": 25880 + }, + { + "epoch": 2.53, + "learning_rate": 2.0971768613340715e-05, + "loss": 0.1183, + "step": 25885 + }, + { + "epoch": 2.53, + "learning_rate": 2.0967616938831996e-05, + "loss": 0.144, + "step": 25890 + }, + { + "epoch": 2.53, + "learning_rate": 2.096346526432328e-05, + "loss": 0.1145, + "step": 25895 + }, + { + "epoch": 2.53, + "learning_rate": 2.095931358981456e-05, + "loss": 0.108, + "step": 25900 + }, + { + "epoch": 2.53, + "learning_rate": 2.095516191530584e-05, + "loss": 0.1385, + "step": 25905 + }, + { + "epoch": 2.53, + "learning_rate": 2.0951010240797122e-05, + "loss": 0.1265, + "step": 25910 + }, + { + "epoch": 2.53, + "learning_rate": 2.0946858566288403e-05, + "loss": 0.1166, + "step": 25915 + }, + { + "epoch": 2.53, + "learning_rate": 2.0942706891779684e-05, + "loss": 0.1164, + "step": 25920 + }, + { + "epoch": 2.54, + "learning_rate": 2.0938555217270964e-05, + "loss": 0.1266, + "step": 25925 + }, + { + "epoch": 2.54, + "learning_rate": 2.093440354276225e-05, + "loss": 0.1026, + "step": 25930 + }, + { + "epoch": 2.54, + "learning_rate": 2.093025186825353e-05, + "loss": 0.1233, + "step": 25935 + }, + { + "epoch": 2.54, + "learning_rate": 2.092610019374481e-05, + "loss": 0.1385, + "step": 25940 + }, + { + "epoch": 2.54, + "learning_rate": 2.0921948519236094e-05, + "loss": 0.1312, + "step": 25945 + }, + { + "epoch": 2.54, + "learning_rate": 2.0917796844727375e-05, + "loss": 0.1167, + "step": 25950 + }, + { + "epoch": 2.54, + "learning_rate": 2.0913645170218656e-05, + "loss": 0.1362, + "step": 25955 + }, + { + "epoch": 2.54, + "learning_rate": 2.0909493495709937e-05, + "loss": 0.128, + "step": 25960 + }, + { + "epoch": 2.54, + "learning_rate": 2.0905341821201217e-05, + "loss": 0.1165, + "step": 25965 + }, + { + "epoch": 2.54, + "learning_rate": 2.09011901466925e-05, + "loss": 0.1405, + "step": 25970 + }, + { + "epoch": 2.54, + "learning_rate": 2.0897038472183782e-05, + "loss": 0.1327, + "step": 25975 + }, + { + "epoch": 2.54, + "learning_rate": 2.0892886797675063e-05, + "loss": 0.1147, + "step": 25980 + }, + { + "epoch": 2.54, + "learning_rate": 2.0888735123166344e-05, + "loss": 0.1271, + "step": 25985 + }, + { + "epoch": 2.54, + "learning_rate": 2.0884583448657625e-05, + "loss": 0.1479, + "step": 25990 + }, + { + "epoch": 2.54, + "learning_rate": 2.088043177414891e-05, + "loss": 0.1187, + "step": 25995 + }, + { + "epoch": 2.54, + "learning_rate": 2.087628009964019e-05, + "loss": 0.1042, + "step": 26000 + }, + { + "epoch": 2.54, + "eval_cer": 0.06035317975078098, + "eval_loss": 0.25076889991760254, + "eval_runtime": 272.3631, + "eval_samples_per_second": 60.104, + "eval_steps_per_second": 1.671, + "eval_wer": 0.1545744826730572, + "step": 26000 + }, + { + "epoch": 2.54, + "learning_rate": 2.087212842513147e-05, + "loss": 0.1364, + "step": 26005 + }, + { + "epoch": 2.54, + "learning_rate": 2.086797675062275e-05, + "loss": 0.129, + "step": 26010 + }, + { + "epoch": 2.54, + "learning_rate": 2.0863825076114035e-05, + "loss": 0.1127, + "step": 26015 + }, + { + "epoch": 2.54, + "learning_rate": 2.0859673401605316e-05, + "loss": 0.1129, + "step": 26020 + }, + { + "epoch": 2.54, + "learning_rate": 2.0855521727096597e-05, + "loss": 0.1318, + "step": 26025 + }, + { + "epoch": 2.55, + "learning_rate": 2.0851370052587877e-05, + "loss": 0.117, + "step": 26030 + }, + { + "epoch": 2.55, + "learning_rate": 2.0847218378079158e-05, + "loss": 0.1153, + "step": 26035 + }, + { + "epoch": 2.55, + "learning_rate": 2.084306670357044e-05, + "loss": 0.1614, + "step": 26040 + }, + { + "epoch": 2.55, + "learning_rate": 2.083891502906172e-05, + "loss": 0.1149, + "step": 26045 + }, + { + "epoch": 2.55, + "learning_rate": 2.0834763354553004e-05, + "loss": 0.1112, + "step": 26050 + }, + { + "epoch": 2.55, + "learning_rate": 2.0830611680044285e-05, + "loss": 0.1507, + "step": 26055 + }, + { + "epoch": 2.55, + "learning_rate": 2.082646000553557e-05, + "loss": 0.1326, + "step": 26060 + }, + { + "epoch": 2.55, + "learning_rate": 2.082230833102685e-05, + "loss": 0.1107, + "step": 26065 + }, + { + "epoch": 2.55, + "learning_rate": 2.081815665651813e-05, + "loss": 0.1344, + "step": 26070 + }, + { + "epoch": 2.55, + "learning_rate": 2.081400498200941e-05, + "loss": 0.1315, + "step": 26075 + }, + { + "epoch": 2.55, + "learning_rate": 2.0809853307500692e-05, + "loss": 0.1269, + "step": 26080 + }, + { + "epoch": 2.55, + "learning_rate": 2.0805701632991973e-05, + "loss": 0.1173, + "step": 26085 + }, + { + "epoch": 2.55, + "learning_rate": 2.0801549958483253e-05, + "loss": 0.1333, + "step": 26090 + }, + { + "epoch": 2.55, + "learning_rate": 2.0797398283974534e-05, + "loss": 0.1177, + "step": 26095 + }, + { + "epoch": 2.55, + "learning_rate": 2.079324660946582e-05, + "loss": 0.1089, + "step": 26100 + }, + { + "epoch": 2.55, + "learning_rate": 2.0789094934957103e-05, + "loss": 0.1448, + "step": 26105 + }, + { + "epoch": 2.55, + "learning_rate": 2.0784943260448383e-05, + "loss": 0.1302, + "step": 26110 + }, + { + "epoch": 2.55, + "learning_rate": 2.0780791585939664e-05, + "loss": 0.1024, + "step": 26115 + }, + { + "epoch": 2.55, + "learning_rate": 2.0776639911430945e-05, + "loss": 0.1072, + "step": 26120 + }, + { + "epoch": 2.55, + "learning_rate": 2.0772488236922226e-05, + "loss": 0.1362, + "step": 26125 + }, + { + "epoch": 2.56, + "learning_rate": 2.0768336562413506e-05, + "loss": 0.0994, + "step": 26130 + }, + { + "epoch": 2.56, + "learning_rate": 2.0764184887904787e-05, + "loss": 0.1213, + "step": 26135 + }, + { + "epoch": 2.56, + "learning_rate": 2.0760033213396068e-05, + "loss": 0.1374, + "step": 26140 + }, + { + "epoch": 2.56, + "learning_rate": 2.075588153888735e-05, + "loss": 0.1187, + "step": 26145 + }, + { + "epoch": 2.56, + "learning_rate": 2.0751729864378636e-05, + "loss": 0.1041, + "step": 26150 + }, + { + "epoch": 2.56, + "learning_rate": 2.0747578189869917e-05, + "loss": 0.1372, + "step": 26155 + }, + { + "epoch": 2.56, + "learning_rate": 2.0743426515361198e-05, + "loss": 0.1157, + "step": 26160 + }, + { + "epoch": 2.56, + "learning_rate": 2.073927484085248e-05, + "loss": 0.1028, + "step": 26165 + }, + { + "epoch": 2.56, + "learning_rate": 2.073512316634376e-05, + "loss": 0.1268, + "step": 26170 + }, + { + "epoch": 2.56, + "learning_rate": 2.073097149183504e-05, + "loss": 0.127, + "step": 26175 + }, + { + "epoch": 2.56, + "learning_rate": 2.072681981732632e-05, + "loss": 0.1084, + "step": 26180 + }, + { + "epoch": 2.56, + "learning_rate": 2.07226681428176e-05, + "loss": 0.13, + "step": 26185 + }, + { + "epoch": 2.56, + "learning_rate": 2.0718516468308882e-05, + "loss": 0.1373, + "step": 26190 + }, + { + "epoch": 2.56, + "learning_rate": 2.0714364793800167e-05, + "loss": 0.1193, + "step": 26195 + }, + { + "epoch": 2.56, + "learning_rate": 2.071021311929145e-05, + "loss": 0.1078, + "step": 26200 + }, + { + "epoch": 2.56, + "learning_rate": 2.070606144478273e-05, + "loss": 0.1313, + "step": 26205 + }, + { + "epoch": 2.56, + "learning_rate": 2.0701909770274012e-05, + "loss": 0.1258, + "step": 26210 + }, + { + "epoch": 2.56, + "learning_rate": 2.0697758095765293e-05, + "loss": 0.1259, + "step": 26215 + }, + { + "epoch": 2.56, + "learning_rate": 2.0693606421256574e-05, + "loss": 0.1353, + "step": 26220 + }, + { + "epoch": 2.56, + "learning_rate": 2.0689454746747855e-05, + "loss": 0.1432, + "step": 26225 + }, + { + "epoch": 2.56, + "learning_rate": 2.0685303072239135e-05, + "loss": 0.1193, + "step": 26230 + }, + { + "epoch": 2.57, + "learning_rate": 2.068115139773042e-05, + "loss": 0.1226, + "step": 26235 + }, + { + "epoch": 2.57, + "learning_rate": 2.06769997232217e-05, + "loss": 0.1388, + "step": 26240 + }, + { + "epoch": 2.57, + "learning_rate": 2.067284804871298e-05, + "loss": 0.1231, + "step": 26245 + }, + { + "epoch": 2.57, + "learning_rate": 2.0668696374204262e-05, + "loss": 0.1221, + "step": 26250 + }, + { + "epoch": 2.57, + "learning_rate": 2.0664544699695546e-05, + "loss": 0.1304, + "step": 26255 + }, + { + "epoch": 2.57, + "learning_rate": 2.0660393025186827e-05, + "loss": 0.1188, + "step": 26260 + }, + { + "epoch": 2.57, + "learning_rate": 2.0656241350678107e-05, + "loss": 0.1195, + "step": 26265 + }, + { + "epoch": 2.57, + "learning_rate": 2.0652089676169388e-05, + "loss": 0.1313, + "step": 26270 + }, + { + "epoch": 2.57, + "learning_rate": 2.064793800166067e-05, + "loss": 0.1393, + "step": 26275 + }, + { + "epoch": 2.57, + "learning_rate": 2.0643786327151953e-05, + "loss": 0.1023, + "step": 26280 + }, + { + "epoch": 2.57, + "learning_rate": 2.0639634652643234e-05, + "loss": 0.129, + "step": 26285 + }, + { + "epoch": 2.57, + "learning_rate": 2.0635482978134515e-05, + "loss": 0.1444, + "step": 26290 + }, + { + "epoch": 2.57, + "learning_rate": 2.0631331303625795e-05, + "loss": 0.1144, + "step": 26295 + }, + { + "epoch": 2.57, + "learning_rate": 2.0627179629117076e-05, + "loss": 0.1102, + "step": 26300 + }, + { + "epoch": 2.57, + "learning_rate": 2.062302795460836e-05, + "loss": 0.1432, + "step": 26305 + }, + { + "epoch": 2.57, + "learning_rate": 2.061887628009964e-05, + "loss": 0.1422, + "step": 26310 + }, + { + "epoch": 2.57, + "learning_rate": 2.0614724605590922e-05, + "loss": 0.1189, + "step": 26315 + }, + { + "epoch": 2.57, + "learning_rate": 2.0610572931082203e-05, + "loss": 0.1264, + "step": 26320 + }, + { + "epoch": 2.57, + "learning_rate": 2.0606421256573487e-05, + "loss": 0.1233, + "step": 26325 + }, + { + "epoch": 2.57, + "learning_rate": 2.0602269582064768e-05, + "loss": 0.1067, + "step": 26330 + }, + { + "epoch": 2.58, + "learning_rate": 2.059811790755605e-05, + "loss": 0.1293, + "step": 26335 + }, + { + "epoch": 2.58, + "learning_rate": 2.059396623304733e-05, + "loss": 0.1543, + "step": 26340 + }, + { + "epoch": 2.58, + "learning_rate": 2.058981455853861e-05, + "loss": 0.1139, + "step": 26345 + }, + { + "epoch": 2.58, + "learning_rate": 2.058566288402989e-05, + "loss": 0.1181, + "step": 26350 + }, + { + "epoch": 2.58, + "learning_rate": 2.0581511209521175e-05, + "loss": 0.1406, + "step": 26355 + }, + { + "epoch": 2.58, + "learning_rate": 2.0577359535012456e-05, + "loss": 0.1262, + "step": 26360 + }, + { + "epoch": 2.58, + "learning_rate": 2.0573207860503736e-05, + "loss": 0.1175, + "step": 26365 + }, + { + "epoch": 2.58, + "learning_rate": 2.056905618599502e-05, + "loss": 0.1365, + "step": 26370 + }, + { + "epoch": 2.58, + "learning_rate": 2.05649045114863e-05, + "loss": 0.1366, + "step": 26375 + }, + { + "epoch": 2.58, + "learning_rate": 2.0560752836977582e-05, + "loss": 0.1273, + "step": 26380 + }, + { + "epoch": 2.58, + "learning_rate": 2.0556601162468863e-05, + "loss": 0.1125, + "step": 26385 + }, + { + "epoch": 2.58, + "learning_rate": 2.0552449487960144e-05, + "loss": 0.1466, + "step": 26390 + }, + { + "epoch": 2.58, + "learning_rate": 2.0548297813451424e-05, + "loss": 0.1082, + "step": 26395 + }, + { + "epoch": 2.58, + "learning_rate": 2.0544146138942705e-05, + "loss": 0.1112, + "step": 26400 + }, + { + "epoch": 2.58, + "learning_rate": 2.053999446443399e-05, + "loss": 0.1557, + "step": 26405 + }, + { + "epoch": 2.58, + "learning_rate": 2.053584278992527e-05, + "loss": 0.1148, + "step": 26410 + }, + { + "epoch": 2.58, + "learning_rate": 2.0531691115416554e-05, + "loss": 0.1138, + "step": 26415 + }, + { + "epoch": 2.58, + "learning_rate": 2.0527539440907835e-05, + "loss": 0.112, + "step": 26420 + }, + { + "epoch": 2.58, + "learning_rate": 2.0523387766399116e-05, + "loss": 0.1506, + "step": 26425 + }, + { + "epoch": 2.58, + "learning_rate": 2.0519236091890397e-05, + "loss": 0.1213, + "step": 26430 + }, + { + "epoch": 2.58, + "learning_rate": 2.0515084417381677e-05, + "loss": 0.1117, + "step": 26435 + }, + { + "epoch": 2.59, + "learning_rate": 2.0510932742872958e-05, + "loss": 0.1447, + "step": 26440 + }, + { + "epoch": 2.59, + "learning_rate": 2.050678106836424e-05, + "loss": 0.1117, + "step": 26445 + }, + { + "epoch": 2.59, + "learning_rate": 2.050262939385552e-05, + "loss": 0.0965, + "step": 26450 + }, + { + "epoch": 2.59, + "learning_rate": 2.0498477719346804e-05, + "loss": 0.1377, + "step": 26455 + }, + { + "epoch": 2.59, + "learning_rate": 2.0494326044838088e-05, + "loss": 0.1232, + "step": 26460 + }, + { + "epoch": 2.59, + "learning_rate": 2.049017437032937e-05, + "loss": 0.1121, + "step": 26465 + }, + { + "epoch": 2.59, + "learning_rate": 2.048602269582065e-05, + "loss": 0.1234, + "step": 26470 + }, + { + "epoch": 2.59, + "learning_rate": 2.048187102131193e-05, + "loss": 0.1284, + "step": 26475 + }, + { + "epoch": 2.59, + "learning_rate": 2.047771934680321e-05, + "loss": 0.1074, + "step": 26480 + }, + { + "epoch": 2.59, + "learning_rate": 2.0473567672294492e-05, + "loss": 0.1067, + "step": 26485 + }, + { + "epoch": 2.59, + "learning_rate": 2.0469415997785773e-05, + "loss": 0.1385, + "step": 26490 + }, + { + "epoch": 2.59, + "learning_rate": 2.0465264323277053e-05, + "loss": 0.1314, + "step": 26495 + }, + { + "epoch": 2.59, + "learning_rate": 2.0461112648768337e-05, + "loss": 0.1238, + "step": 26500 + }, + { + "epoch": 2.59, + "eval_cer": 0.06162031673800093, + "eval_loss": 0.25676214694976807, + "eval_runtime": 276.1673, + "eval_samples_per_second": 59.276, + "eval_steps_per_second": 1.648, + "eval_wer": 0.15653343606955591, + "step": 26500 + }, + { + "epoch": 2.59, + "learning_rate": 2.0456960974259618e-05, + "loss": 0.1565, + "step": 26505 + }, + { + "epoch": 2.59, + "learning_rate": 2.0452809299750902e-05, + "loss": 0.1191, + "step": 26510 + }, + { + "epoch": 2.59, + "learning_rate": 2.0448657625242183e-05, + "loss": 0.1073, + "step": 26515 + }, + { + "epoch": 2.59, + "learning_rate": 2.0444505950733464e-05, + "loss": 0.1337, + "step": 26520 + }, + { + "epoch": 2.59, + "learning_rate": 2.0440354276224745e-05, + "loss": 0.1318, + "step": 26525 + }, + { + "epoch": 2.59, + "learning_rate": 2.0436202601716025e-05, + "loss": 0.1164, + "step": 26530 + }, + { + "epoch": 2.59, + "learning_rate": 2.0432050927207306e-05, + "loss": 0.1163, + "step": 26535 + }, + { + "epoch": 2.6, + "learning_rate": 2.0427899252698587e-05, + "loss": 0.1373, + "step": 26540 + }, + { + "epoch": 2.6, + "learning_rate": 2.042374757818987e-05, + "loss": 0.117, + "step": 26545 + }, + { + "epoch": 2.6, + "learning_rate": 2.0419595903681152e-05, + "loss": 0.0874, + "step": 26550 + }, + { + "epoch": 2.6, + "learning_rate": 2.0415444229172433e-05, + "loss": 0.1243, + "step": 26555 + }, + { + "epoch": 2.6, + "learning_rate": 2.0411292554663717e-05, + "loss": 0.1373, + "step": 26560 + }, + { + "epoch": 2.6, + "learning_rate": 2.0407140880154998e-05, + "loss": 0.1012, + "step": 26565 + }, + { + "epoch": 2.6, + "learning_rate": 2.040298920564628e-05, + "loss": 0.1101, + "step": 26570 + }, + { + "epoch": 2.6, + "learning_rate": 2.039883753113756e-05, + "loss": 0.1469, + "step": 26575 + }, + { + "epoch": 2.6, + "learning_rate": 2.039468585662884e-05, + "loss": 0.1203, + "step": 26580 + }, + { + "epoch": 2.6, + "learning_rate": 2.039053418212012e-05, + "loss": 0.1039, + "step": 26585 + }, + { + "epoch": 2.6, + "learning_rate": 2.0386382507611405e-05, + "loss": 0.1309, + "step": 26590 + }, + { + "epoch": 2.6, + "learning_rate": 2.0382230833102686e-05, + "loss": 0.1089, + "step": 26595 + }, + { + "epoch": 2.6, + "learning_rate": 2.0378079158593966e-05, + "loss": 0.0967, + "step": 26600 + }, + { + "epoch": 2.6, + "learning_rate": 2.0373927484085247e-05, + "loss": 0.1451, + "step": 26605 + }, + { + "epoch": 2.6, + "learning_rate": 2.036977580957653e-05, + "loss": 0.1239, + "step": 26610 + }, + { + "epoch": 2.6, + "learning_rate": 2.0365624135067812e-05, + "loss": 0.1087, + "step": 26615 + }, + { + "epoch": 2.6, + "learning_rate": 2.0361472460559093e-05, + "loss": 0.1104, + "step": 26620 + }, + { + "epoch": 2.6, + "learning_rate": 2.0357320786050374e-05, + "loss": 0.1354, + "step": 26625 + }, + { + "epoch": 2.6, + "learning_rate": 2.0353169111541654e-05, + "loss": 0.1185, + "step": 26630 + }, + { + "epoch": 2.6, + "learning_rate": 2.034901743703294e-05, + "loss": 0.1037, + "step": 26635 + }, + { + "epoch": 2.6, + "learning_rate": 2.034486576252422e-05, + "loss": 0.143, + "step": 26640 + }, + { + "epoch": 2.61, + "learning_rate": 2.03407140880155e-05, + "loss": 0.103, + "step": 26645 + }, + { + "epoch": 2.61, + "learning_rate": 2.033656241350678e-05, + "loss": 0.1061, + "step": 26650 + }, + { + "epoch": 2.61, + "learning_rate": 2.033241073899806e-05, + "loss": 0.1552, + "step": 26655 + }, + { + "epoch": 2.61, + "learning_rate": 2.0328259064489342e-05, + "loss": 0.1231, + "step": 26660 + }, + { + "epoch": 2.61, + "learning_rate": 2.0324107389980627e-05, + "loss": 0.127, + "step": 26665 + }, + { + "epoch": 2.61, + "learning_rate": 2.0319955715471907e-05, + "loss": 0.1159, + "step": 26670 + }, + { + "epoch": 2.61, + "learning_rate": 2.031580404096319e-05, + "loss": 0.1239, + "step": 26675 + }, + { + "epoch": 2.61, + "learning_rate": 2.0311652366454472e-05, + "loss": 0.1127, + "step": 26680 + }, + { + "epoch": 2.61, + "learning_rate": 2.0307500691945753e-05, + "loss": 0.13, + "step": 26685 + }, + { + "epoch": 2.61, + "learning_rate": 2.0303349017437034e-05, + "loss": 0.1325, + "step": 26690 + }, + { + "epoch": 2.61, + "learning_rate": 2.0299197342928315e-05, + "loss": 0.1156, + "step": 26695 + }, + { + "epoch": 2.61, + "learning_rate": 2.0295045668419595e-05, + "loss": 0.096, + "step": 26700 + }, + { + "epoch": 2.61, + "learning_rate": 2.0290893993910876e-05, + "loss": 0.1799, + "step": 26705 + }, + { + "epoch": 2.61, + "learning_rate": 2.0286742319402157e-05, + "loss": 0.1234, + "step": 26710 + }, + { + "epoch": 2.61, + "learning_rate": 2.028259064489344e-05, + "loss": 0.1086, + "step": 26715 + }, + { + "epoch": 2.61, + "learning_rate": 2.0278438970384725e-05, + "loss": 0.117, + "step": 26720 + }, + { + "epoch": 2.61, + "learning_rate": 2.0274287295876006e-05, + "loss": 0.1346, + "step": 26725 + }, + { + "epoch": 2.61, + "learning_rate": 2.0270135621367287e-05, + "loss": 0.1167, + "step": 26730 + }, + { + "epoch": 2.61, + "learning_rate": 2.0265983946858567e-05, + "loss": 0.1106, + "step": 26735 + }, + { + "epoch": 2.61, + "learning_rate": 2.0261832272349848e-05, + "loss": 0.1447, + "step": 26740 + }, + { + "epoch": 2.62, + "learning_rate": 2.025768059784113e-05, + "loss": 0.1174, + "step": 26745 + }, + { + "epoch": 2.62, + "learning_rate": 2.025352892333241e-05, + "loss": 0.1178, + "step": 26750 + }, + { + "epoch": 2.62, + "learning_rate": 2.024937724882369e-05, + "loss": 0.1232, + "step": 26755 + }, + { + "epoch": 2.62, + "learning_rate": 2.024522557431497e-05, + "loss": 0.1154, + "step": 26760 + }, + { + "epoch": 2.62, + "learning_rate": 2.024107389980626e-05, + "loss": 0.1196, + "step": 26765 + }, + { + "epoch": 2.62, + "learning_rate": 2.023692222529754e-05, + "loss": 0.1267, + "step": 26770 + }, + { + "epoch": 2.62, + "learning_rate": 2.023277055078882e-05, + "loss": 0.1379, + "step": 26775 + }, + { + "epoch": 2.62, + "learning_rate": 2.02286188762801e-05, + "loss": 0.111, + "step": 26780 + }, + { + "epoch": 2.62, + "learning_rate": 2.0224467201771382e-05, + "loss": 0.1084, + "step": 26785 + }, + { + "epoch": 2.62, + "learning_rate": 2.0220315527262663e-05, + "loss": 0.1382, + "step": 26790 + }, + { + "epoch": 2.62, + "learning_rate": 2.0216163852753943e-05, + "loss": 0.1118, + "step": 26795 + }, + { + "epoch": 2.62, + "learning_rate": 2.0212012178245224e-05, + "loss": 0.11, + "step": 26800 + }, + { + "epoch": 2.62, + "learning_rate": 2.0207860503736505e-05, + "loss": 0.1195, + "step": 26805 + }, + { + "epoch": 2.62, + "learning_rate": 2.020370882922779e-05, + "loss": 0.1293, + "step": 26810 + }, + { + "epoch": 2.62, + "learning_rate": 2.0199557154719073e-05, + "loss": 0.1227, + "step": 26815 + }, + { + "epoch": 2.62, + "learning_rate": 2.0195405480210354e-05, + "loss": 0.1311, + "step": 26820 + }, + { + "epoch": 2.62, + "learning_rate": 2.0191253805701635e-05, + "loss": 0.146, + "step": 26825 + }, + { + "epoch": 2.62, + "learning_rate": 2.0187102131192916e-05, + "loss": 0.1211, + "step": 26830 + }, + { + "epoch": 2.62, + "learning_rate": 2.0182950456684196e-05, + "loss": 0.1109, + "step": 26835 + }, + { + "epoch": 2.62, + "learning_rate": 2.0178798782175477e-05, + "loss": 0.1394, + "step": 26840 + }, + { + "epoch": 2.62, + "learning_rate": 2.0174647107666758e-05, + "loss": 0.1235, + "step": 26845 + }, + { + "epoch": 2.63, + "learning_rate": 2.017049543315804e-05, + "loss": 0.1006, + "step": 26850 + }, + { + "epoch": 2.63, + "learning_rate": 2.0166343758649323e-05, + "loss": 0.1228, + "step": 26855 + }, + { + "epoch": 2.63, + "learning_rate": 2.0162192084140604e-05, + "loss": 0.1278, + "step": 26860 + }, + { + "epoch": 2.63, + "learning_rate": 2.0158040409631884e-05, + "loss": 0.1036, + "step": 26865 + }, + { + "epoch": 2.63, + "learning_rate": 2.015388873512317e-05, + "loss": 0.1106, + "step": 26870 + }, + { + "epoch": 2.63, + "learning_rate": 2.014973706061445e-05, + "loss": 0.1468, + "step": 26875 + }, + { + "epoch": 2.63, + "learning_rate": 2.014558538610573e-05, + "loss": 0.1185, + "step": 26880 + }, + { + "epoch": 2.63, + "learning_rate": 2.014143371159701e-05, + "loss": 0.1161, + "step": 26885 + }, + { + "epoch": 2.63, + "learning_rate": 2.013728203708829e-05, + "loss": 0.1399, + "step": 26890 + }, + { + "epoch": 2.63, + "learning_rate": 2.0133130362579572e-05, + "loss": 0.1074, + "step": 26895 + }, + { + "epoch": 2.63, + "learning_rate": 2.0128978688070857e-05, + "loss": 0.1149, + "step": 26900 + }, + { + "epoch": 2.63, + "learning_rate": 2.0124827013562137e-05, + "loss": 0.1277, + "step": 26905 + }, + { + "epoch": 2.63, + "learning_rate": 2.0120675339053418e-05, + "loss": 0.1098, + "step": 26910 + }, + { + "epoch": 2.63, + "learning_rate": 2.01165236645447e-05, + "loss": 0.1116, + "step": 26915 + }, + { + "epoch": 2.63, + "learning_rate": 2.0112371990035983e-05, + "loss": 0.1188, + "step": 26920 + }, + { + "epoch": 2.63, + "learning_rate": 2.0108220315527264e-05, + "loss": 0.134, + "step": 26925 + }, + { + "epoch": 2.63, + "learning_rate": 2.0104068641018545e-05, + "loss": 0.1164, + "step": 26930 + }, + { + "epoch": 2.63, + "learning_rate": 2.0099916966509825e-05, + "loss": 0.1198, + "step": 26935 + }, + { + "epoch": 2.63, + "learning_rate": 2.009576529200111e-05, + "loss": 0.1383, + "step": 26940 + }, + { + "epoch": 2.63, + "learning_rate": 2.009161361749239e-05, + "loss": 0.113, + "step": 26945 + }, + { + "epoch": 2.64, + "learning_rate": 2.008746194298367e-05, + "loss": 0.1381, + "step": 26950 + }, + { + "epoch": 2.64, + "learning_rate": 2.0083310268474952e-05, + "loss": 0.1401, + "step": 26955 + }, + { + "epoch": 2.64, + "learning_rate": 2.0079158593966233e-05, + "loss": 0.1348, + "step": 26960 + }, + { + "epoch": 2.64, + "learning_rate": 2.0075006919457513e-05, + "loss": 0.1236, + "step": 26965 + }, + { + "epoch": 2.64, + "learning_rate": 2.0070855244948797e-05, + "loss": 0.1193, + "step": 26970 + }, + { + "epoch": 2.64, + "learning_rate": 2.0066703570440078e-05, + "loss": 0.1369, + "step": 26975 + }, + { + "epoch": 2.64, + "learning_rate": 2.006255189593136e-05, + "loss": 0.1112, + "step": 26980 + }, + { + "epoch": 2.64, + "learning_rate": 2.0058400221422643e-05, + "loss": 0.1164, + "step": 26985 + }, + { + "epoch": 2.64, + "learning_rate": 2.0054248546913924e-05, + "loss": 0.1276, + "step": 26990 + }, + { + "epoch": 2.64, + "learning_rate": 2.0050096872405205e-05, + "loss": 0.1169, + "step": 26995 + }, + { + "epoch": 2.64, + "learning_rate": 2.0045945197896485e-05, + "loss": 0.1178, + "step": 27000 + }, + { + "epoch": 2.64, + "eval_cer": 0.061490828286752175, + "eval_loss": 0.25637540221214294, + "eval_runtime": 272.7475, + "eval_samples_per_second": 60.019, + "eval_steps_per_second": 1.668, + "eval_wer": 0.15738231587470533, + "step": 27000 + }, + { + "epoch": 2.64, + "learning_rate": 2.0041793523387766e-05, + "loss": 0.1424, + "step": 27005 + }, + { + "epoch": 2.64, + "learning_rate": 2.0037641848879047e-05, + "loss": 0.125, + "step": 27010 + }, + { + "epoch": 2.64, + "learning_rate": 2.0033490174370328e-05, + "loss": 0.1268, + "step": 27015 + }, + { + "epoch": 2.64, + "learning_rate": 2.0029338499861612e-05, + "loss": 0.1122, + "step": 27020 + }, + { + "epoch": 2.64, + "learning_rate": 2.0025186825352893e-05, + "loss": 0.1506, + "step": 27025 + }, + { + "epoch": 2.64, + "learning_rate": 2.0021035150844177e-05, + "loss": 0.1157, + "step": 27030 + }, + { + "epoch": 2.64, + "learning_rate": 2.0016883476335458e-05, + "loss": 0.1368, + "step": 27035 + }, + { + "epoch": 2.64, + "learning_rate": 2.001273180182674e-05, + "loss": 0.1485, + "step": 27040 + }, + { + "epoch": 2.64, + "learning_rate": 2.000858012731802e-05, + "loss": 0.1164, + "step": 27045 + }, + { + "epoch": 2.65, + "learning_rate": 2.00044284528093e-05, + "loss": 0.1058, + "step": 27050 + }, + { + "epoch": 2.65, + "learning_rate": 2.000027677830058e-05, + "loss": 0.1105, + "step": 27055 + }, + { + "epoch": 2.65, + "learning_rate": 1.999612510379186e-05, + "loss": 0.1168, + "step": 27060 + }, + { + "epoch": 2.65, + "learning_rate": 1.9991973429283142e-05, + "loss": 0.1183, + "step": 27065 + }, + { + "epoch": 2.65, + "learning_rate": 1.9987821754774423e-05, + "loss": 0.1313, + "step": 27070 + }, + { + "epoch": 2.65, + "learning_rate": 1.998367008026571e-05, + "loss": 0.1315, + "step": 27075 + }, + { + "epoch": 2.65, + "learning_rate": 1.997951840575699e-05, + "loss": 0.105, + "step": 27080 + }, + { + "epoch": 2.65, + "learning_rate": 1.9975366731248272e-05, + "loss": 0.1184, + "step": 27085 + }, + { + "epoch": 2.65, + "learning_rate": 1.9971215056739553e-05, + "loss": 0.1315, + "step": 27090 + }, + { + "epoch": 2.65, + "learning_rate": 1.9967063382230834e-05, + "loss": 0.1124, + "step": 27095 + }, + { + "epoch": 2.65, + "learning_rate": 1.9962911707722114e-05, + "loss": 0.1135, + "step": 27100 + }, + { + "epoch": 2.65, + "learning_rate": 1.9958760033213395e-05, + "loss": 0.1387, + "step": 27105 + }, + { + "epoch": 2.65, + "learning_rate": 1.9954608358704676e-05, + "loss": 0.1226, + "step": 27110 + }, + { + "epoch": 2.65, + "learning_rate": 1.9950456684195957e-05, + "loss": 0.1247, + "step": 27115 + }, + { + "epoch": 2.65, + "learning_rate": 1.994630500968724e-05, + "loss": 0.1294, + "step": 27120 + }, + { + "epoch": 2.65, + "learning_rate": 1.9942153335178525e-05, + "loss": 0.1626, + "step": 27125 + }, + { + "epoch": 2.65, + "learning_rate": 1.9938001660669806e-05, + "loss": 0.1169, + "step": 27130 + }, + { + "epoch": 2.65, + "learning_rate": 1.9933849986161087e-05, + "loss": 0.1179, + "step": 27135 + }, + { + "epoch": 2.65, + "learning_rate": 1.9929698311652367e-05, + "loss": 0.1454, + "step": 27140 + }, + { + "epoch": 2.65, + "learning_rate": 1.9925546637143648e-05, + "loss": 0.1112, + "step": 27145 + }, + { + "epoch": 2.65, + "learning_rate": 1.992139496263493e-05, + "loss": 0.1113, + "step": 27150 + }, + { + "epoch": 2.66, + "learning_rate": 1.991724328812621e-05, + "loss": 0.1344, + "step": 27155 + }, + { + "epoch": 2.66, + "learning_rate": 1.9913091613617494e-05, + "loss": 0.1129, + "step": 27160 + }, + { + "epoch": 2.66, + "learning_rate": 1.9908939939108775e-05, + "loss": 0.1107, + "step": 27165 + }, + { + "epoch": 2.66, + "learning_rate": 1.9904788264600055e-05, + "loss": 0.123, + "step": 27170 + }, + { + "epoch": 2.66, + "learning_rate": 1.990063659009134e-05, + "loss": 0.1338, + "step": 27175 + }, + { + "epoch": 2.66, + "learning_rate": 1.989648491558262e-05, + "loss": 0.1148, + "step": 27180 + }, + { + "epoch": 2.66, + "learning_rate": 1.98923332410739e-05, + "loss": 0.1029, + "step": 27185 + }, + { + "epoch": 2.66, + "learning_rate": 1.9888181566565182e-05, + "loss": 0.1454, + "step": 27190 + }, + { + "epoch": 2.66, + "learning_rate": 1.9884029892056463e-05, + "loss": 0.1146, + "step": 27195 + }, + { + "epoch": 2.66, + "learning_rate": 1.9879878217547743e-05, + "loss": 0.117, + "step": 27200 + }, + { + "epoch": 2.66, + "learning_rate": 1.9875726543039027e-05, + "loss": 0.1443, + "step": 27205 + }, + { + "epoch": 2.66, + "learning_rate": 1.9871574868530308e-05, + "loss": 0.1322, + "step": 27210 + }, + { + "epoch": 2.66, + "learning_rate": 1.986742319402159e-05, + "loss": 0.1393, + "step": 27215 + }, + { + "epoch": 2.66, + "learning_rate": 1.986327151951287e-05, + "loss": 0.1241, + "step": 27220 + }, + { + "epoch": 2.66, + "learning_rate": 1.9859119845004154e-05, + "loss": 0.1317, + "step": 27225 + }, + { + "epoch": 2.66, + "learning_rate": 1.9854968170495435e-05, + "loss": 0.117, + "step": 27230 + }, + { + "epoch": 2.66, + "learning_rate": 1.9850816495986715e-05, + "loss": 0.1128, + "step": 27235 + }, + { + "epoch": 2.66, + "learning_rate": 1.9846664821477996e-05, + "loss": 0.1409, + "step": 27240 + }, + { + "epoch": 2.66, + "learning_rate": 1.9842513146969277e-05, + "loss": 0.1121, + "step": 27245 + }, + { + "epoch": 2.66, + "learning_rate": 1.983836147246056e-05, + "loss": 0.1162, + "step": 27250 + }, + { + "epoch": 2.67, + "learning_rate": 1.9834209797951842e-05, + "loss": 0.1493, + "step": 27255 + }, + { + "epoch": 2.67, + "learning_rate": 1.9830058123443123e-05, + "loss": 0.1189, + "step": 27260 + }, + { + "epoch": 2.67, + "learning_rate": 1.9825906448934403e-05, + "loss": 0.1233, + "step": 27265 + }, + { + "epoch": 2.67, + "learning_rate": 1.9821754774425684e-05, + "loss": 0.126, + "step": 27270 + }, + { + "epoch": 2.67, + "learning_rate": 1.9817603099916965e-05, + "loss": 0.1436, + "step": 27275 + }, + { + "epoch": 2.67, + "learning_rate": 1.981345142540825e-05, + "loss": 0.1136, + "step": 27280 + }, + { + "epoch": 2.67, + "learning_rate": 1.980929975089953e-05, + "loss": 0.1059, + "step": 27285 + }, + { + "epoch": 2.67, + "learning_rate": 1.980514807639081e-05, + "loss": 0.1464, + "step": 27290 + }, + { + "epoch": 2.67, + "learning_rate": 1.9800996401882095e-05, + "loss": 0.1121, + "step": 27295 + }, + { + "epoch": 2.67, + "learning_rate": 1.9796844727373376e-05, + "loss": 0.1119, + "step": 27300 + }, + { + "epoch": 2.67, + "learning_rate": 1.9792693052864656e-05, + "loss": 0.1305, + "step": 27305 + }, + { + "epoch": 2.67, + "learning_rate": 1.9788541378355937e-05, + "loss": 0.1364, + "step": 27310 + }, + { + "epoch": 2.67, + "learning_rate": 1.9784389703847218e-05, + "loss": 0.1078, + "step": 27315 + }, + { + "epoch": 2.67, + "learning_rate": 1.97802380293385e-05, + "loss": 0.1319, + "step": 27320 + }, + { + "epoch": 2.67, + "learning_rate": 1.977608635482978e-05, + "loss": 0.1391, + "step": 27325 + }, + { + "epoch": 2.67, + "learning_rate": 1.9771934680321064e-05, + "loss": 0.1227, + "step": 27330 + }, + { + "epoch": 2.67, + "learning_rate": 1.9767783005812344e-05, + "loss": 0.1106, + "step": 27335 + }, + { + "epoch": 2.67, + "learning_rate": 1.976363133130363e-05, + "loss": 0.1332, + "step": 27340 + }, + { + "epoch": 2.67, + "learning_rate": 1.975947965679491e-05, + "loss": 0.1009, + "step": 27345 + }, + { + "epoch": 2.67, + "learning_rate": 1.975532798228619e-05, + "loss": 0.1193, + "step": 27350 + }, + { + "epoch": 2.67, + "learning_rate": 1.975117630777747e-05, + "loss": 0.1376, + "step": 27355 + }, + { + "epoch": 2.68, + "learning_rate": 1.974702463326875e-05, + "loss": 0.1124, + "step": 27360 + }, + { + "epoch": 2.68, + "learning_rate": 1.9742872958760032e-05, + "loss": 0.118, + "step": 27365 + }, + { + "epoch": 2.68, + "learning_rate": 1.9738721284251313e-05, + "loss": 0.1182, + "step": 27370 + }, + { + "epoch": 2.68, + "learning_rate": 1.9734569609742594e-05, + "loss": 0.143, + "step": 27375 + }, + { + "epoch": 2.68, + "learning_rate": 1.973041793523388e-05, + "loss": 0.1314, + "step": 27380 + }, + { + "epoch": 2.68, + "learning_rate": 1.9726266260725162e-05, + "loss": 0.1098, + "step": 27385 + }, + { + "epoch": 2.68, + "learning_rate": 1.9722114586216443e-05, + "loss": 0.1334, + "step": 27390 + }, + { + "epoch": 2.68, + "learning_rate": 1.9717962911707724e-05, + "loss": 0.117, + "step": 27395 + }, + { + "epoch": 2.68, + "learning_rate": 1.9713811237199004e-05, + "loss": 0.1051, + "step": 27400 + }, + { + "epoch": 2.68, + "learning_rate": 1.9709659562690285e-05, + "loss": 0.1334, + "step": 27405 + }, + { + "epoch": 2.68, + "learning_rate": 1.9705507888181566e-05, + "loss": 0.1225, + "step": 27410 + }, + { + "epoch": 2.68, + "learning_rate": 1.9701356213672847e-05, + "loss": 0.1043, + "step": 27415 + }, + { + "epoch": 2.68, + "learning_rate": 1.9697204539164128e-05, + "loss": 0.1282, + "step": 27420 + }, + { + "epoch": 2.68, + "learning_rate": 1.9693052864655412e-05, + "loss": 0.1498, + "step": 27425 + }, + { + "epoch": 2.68, + "learning_rate": 1.9688901190146696e-05, + "loss": 0.1136, + "step": 27430 + }, + { + "epoch": 2.68, + "learning_rate": 1.9684749515637977e-05, + "loss": 0.1174, + "step": 27435 + }, + { + "epoch": 2.68, + "learning_rate": 1.9680597841129257e-05, + "loss": 0.1481, + "step": 27440 + }, + { + "epoch": 2.68, + "learning_rate": 1.9676446166620538e-05, + "loss": 0.1154, + "step": 27445 + }, + { + "epoch": 2.68, + "learning_rate": 1.967229449211182e-05, + "loss": 0.1146, + "step": 27450 + }, + { + "epoch": 2.68, + "learning_rate": 1.96681428176031e-05, + "loss": 0.1333, + "step": 27455 + }, + { + "epoch": 2.69, + "learning_rate": 1.966399114309438e-05, + "loss": 0.1206, + "step": 27460 + }, + { + "epoch": 2.69, + "learning_rate": 1.965983946858566e-05, + "loss": 0.0973, + "step": 27465 + }, + { + "epoch": 2.69, + "learning_rate": 1.9655687794076945e-05, + "loss": 0.124, + "step": 27470 + }, + { + "epoch": 2.69, + "learning_rate": 1.9651536119568226e-05, + "loss": 0.1336, + "step": 27475 + }, + { + "epoch": 2.69, + "learning_rate": 1.9647384445059507e-05, + "loss": 0.1151, + "step": 27480 + }, + { + "epoch": 2.69, + "learning_rate": 1.964323277055079e-05, + "loss": 0.1238, + "step": 27485 + }, + { + "epoch": 2.69, + "learning_rate": 1.9639081096042072e-05, + "loss": 0.1454, + "step": 27490 + }, + { + "epoch": 2.69, + "learning_rate": 1.9634929421533353e-05, + "loss": 0.1156, + "step": 27495 + }, + { + "epoch": 2.69, + "learning_rate": 1.9630777747024633e-05, + "loss": 0.1207, + "step": 27500 + }, + { + "epoch": 2.69, + "eval_cer": 0.060481512055143585, + "eval_loss": 0.24564869701862335, + "eval_runtime": 278.6272, + "eval_samples_per_second": 58.752, + "eval_steps_per_second": 1.633, + "eval_wer": 0.1551752283813168, + "step": 27500 + }, + { + "epoch": 2.69, + "learning_rate": 1.9626626072515914e-05, + "loss": 0.1396, + "step": 27505 + }, + { + "epoch": 2.69, + "learning_rate": 1.9622474398007195e-05, + "loss": 0.1065, + "step": 27510 + }, + { + "epoch": 2.69, + "learning_rate": 1.961832272349848e-05, + "loss": 0.1239, + "step": 27515 + }, + { + "epoch": 2.69, + "learning_rate": 1.961417104898976e-05, + "loss": 0.1185, + "step": 27520 + }, + { + "epoch": 2.69, + "learning_rate": 1.961001937448104e-05, + "loss": 0.1497, + "step": 27525 + }, + { + "epoch": 2.69, + "learning_rate": 1.960586769997232e-05, + "loss": 0.1131, + "step": 27530 + }, + { + "epoch": 2.69, + "learning_rate": 1.9601716025463606e-05, + "loss": 0.1247, + "step": 27535 + }, + { + "epoch": 2.69, + "learning_rate": 1.9597564350954886e-05, + "loss": 0.1354, + "step": 27540 + }, + { + "epoch": 2.69, + "learning_rate": 1.9593412676446167e-05, + "loss": 0.1133, + "step": 27545 + }, + { + "epoch": 2.69, + "learning_rate": 1.9589261001937448e-05, + "loss": 0.1187, + "step": 27550 + }, + { + "epoch": 2.69, + "learning_rate": 1.958510932742873e-05, + "loss": 0.1454, + "step": 27555 + }, + { + "epoch": 2.69, + "learning_rate": 1.9580957652920013e-05, + "loss": 0.133, + "step": 27560 + }, + { + "epoch": 2.7, + "learning_rate": 1.9576805978411294e-05, + "loss": 0.1124, + "step": 27565 + }, + { + "epoch": 2.7, + "learning_rate": 1.9572654303902574e-05, + "loss": 0.1199, + "step": 27570 + }, + { + "epoch": 2.7, + "learning_rate": 1.9568502629393855e-05, + "loss": 0.1495, + "step": 27575 + }, + { + "epoch": 2.7, + "learning_rate": 1.9564350954885136e-05, + "loss": 0.1259, + "step": 27580 + }, + { + "epoch": 2.7, + "learning_rate": 1.956019928037642e-05, + "loss": 0.1161, + "step": 27585 + }, + { + "epoch": 2.7, + "learning_rate": 1.95560476058677e-05, + "loss": 0.1393, + "step": 27590 + }, + { + "epoch": 2.7, + "learning_rate": 1.955189593135898e-05, + "loss": 0.121, + "step": 27595 + }, + { + "epoch": 2.7, + "learning_rate": 1.9547744256850262e-05, + "loss": 0.1142, + "step": 27600 + }, + { + "epoch": 2.7, + "learning_rate": 1.9543592582341546e-05, + "loss": 0.1214, + "step": 27605 + }, + { + "epoch": 2.7, + "learning_rate": 1.9539440907832827e-05, + "loss": 0.1102, + "step": 27610 + }, + { + "epoch": 2.7, + "learning_rate": 1.9535289233324108e-05, + "loss": 0.1083, + "step": 27615 + }, + { + "epoch": 2.7, + "learning_rate": 1.953113755881539e-05, + "loss": 0.1121, + "step": 27620 + }, + { + "epoch": 2.7, + "learning_rate": 1.952698588430667e-05, + "loss": 0.1326, + "step": 27625 + }, + { + "epoch": 2.7, + "learning_rate": 1.952283420979795e-05, + "loss": 0.1183, + "step": 27630 + }, + { + "epoch": 2.7, + "learning_rate": 1.9518682535289234e-05, + "loss": 0.105, + "step": 27635 + }, + { + "epoch": 2.7, + "learning_rate": 1.9514530860780515e-05, + "loss": 0.1393, + "step": 27640 + }, + { + "epoch": 2.7, + "learning_rate": 1.95103791862718e-05, + "loss": 0.122, + "step": 27645 + }, + { + "epoch": 2.7, + "learning_rate": 1.950622751176308e-05, + "loss": 0.0957, + "step": 27650 + }, + { + "epoch": 2.7, + "learning_rate": 1.950207583725436e-05, + "loss": 0.1504, + "step": 27655 + }, + { + "epoch": 2.7, + "learning_rate": 1.9497924162745642e-05, + "loss": 0.1181, + "step": 27660 + }, + { + "epoch": 2.71, + "learning_rate": 1.9493772488236922e-05, + "loss": 0.1078, + "step": 27665 + }, + { + "epoch": 2.71, + "learning_rate": 1.9489620813728203e-05, + "loss": 0.1114, + "step": 27670 + }, + { + "epoch": 2.71, + "learning_rate": 1.9485469139219484e-05, + "loss": 0.1346, + "step": 27675 + }, + { + "epoch": 2.71, + "learning_rate": 1.9481317464710765e-05, + "loss": 0.1226, + "step": 27680 + }, + { + "epoch": 2.71, + "learning_rate": 1.9477165790202046e-05, + "loss": 0.1192, + "step": 27685 + }, + { + "epoch": 2.71, + "learning_rate": 1.9473014115693333e-05, + "loss": 0.1423, + "step": 27690 + }, + { + "epoch": 2.71, + "learning_rate": 1.9468862441184614e-05, + "loss": 0.1151, + "step": 27695 + }, + { + "epoch": 2.71, + "learning_rate": 1.9464710766675895e-05, + "loss": 0.1141, + "step": 27700 + }, + { + "epoch": 2.71, + "learning_rate": 1.9460559092167175e-05, + "loss": 0.1359, + "step": 27705 + }, + { + "epoch": 2.71, + "learning_rate": 1.9456407417658456e-05, + "loss": 0.1172, + "step": 27710 + }, + { + "epoch": 2.71, + "learning_rate": 1.9452255743149737e-05, + "loss": 0.1052, + "step": 27715 + }, + { + "epoch": 2.71, + "learning_rate": 1.9448104068641018e-05, + "loss": 0.1231, + "step": 27720 + }, + { + "epoch": 2.71, + "learning_rate": 1.94439523941323e-05, + "loss": 0.1392, + "step": 27725 + }, + { + "epoch": 2.71, + "learning_rate": 1.943980071962358e-05, + "loss": 0.1178, + "step": 27730 + }, + { + "epoch": 2.71, + "learning_rate": 1.9435649045114863e-05, + "loss": 0.1139, + "step": 27735 + }, + { + "epoch": 2.71, + "learning_rate": 1.9431497370606148e-05, + "loss": 0.14, + "step": 27740 + }, + { + "epoch": 2.71, + "learning_rate": 1.942734569609743e-05, + "loss": 0.1151, + "step": 27745 + }, + { + "epoch": 2.71, + "learning_rate": 1.942319402158871e-05, + "loss": 0.1194, + "step": 27750 + }, + { + "epoch": 2.71, + "learning_rate": 1.941904234707999e-05, + "loss": 0.1381, + "step": 27755 + }, + { + "epoch": 2.71, + "learning_rate": 1.941489067257127e-05, + "loss": 0.1199, + "step": 27760 + }, + { + "epoch": 2.71, + "learning_rate": 1.941073899806255e-05, + "loss": 0.1087, + "step": 27765 + }, + { + "epoch": 2.72, + "learning_rate": 1.9406587323553832e-05, + "loss": 0.1165, + "step": 27770 + }, + { + "epoch": 2.72, + "learning_rate": 1.9402435649045113e-05, + "loss": 0.1365, + "step": 27775 + }, + { + "epoch": 2.72, + "learning_rate": 1.9398283974536397e-05, + "loss": 0.1174, + "step": 27780 + }, + { + "epoch": 2.72, + "learning_rate": 1.9394132300027678e-05, + "loss": 0.1218, + "step": 27785 + }, + { + "epoch": 2.72, + "learning_rate": 1.9389980625518962e-05, + "loss": 0.1388, + "step": 27790 + }, + { + "epoch": 2.72, + "learning_rate": 1.9385828951010243e-05, + "loss": 0.1181, + "step": 27795 + }, + { + "epoch": 2.72, + "learning_rate": 1.9381677276501524e-05, + "loss": 0.1174, + "step": 27800 + }, + { + "epoch": 2.72, + "learning_rate": 1.9377525601992804e-05, + "loss": 0.147, + "step": 27805 + }, + { + "epoch": 2.72, + "learning_rate": 1.9373373927484085e-05, + "loss": 0.1177, + "step": 27810 + }, + { + "epoch": 2.72, + "learning_rate": 1.9369222252975366e-05, + "loss": 0.1232, + "step": 27815 + }, + { + "epoch": 2.72, + "learning_rate": 1.9365070578466647e-05, + "loss": 0.1358, + "step": 27820 + }, + { + "epoch": 2.72, + "learning_rate": 1.936091890395793e-05, + "loss": 0.1267, + "step": 27825 + }, + { + "epoch": 2.72, + "learning_rate": 1.935676722944921e-05, + "loss": 0.1061, + "step": 27830 + }, + { + "epoch": 2.72, + "learning_rate": 1.9352615554940492e-05, + "loss": 0.0983, + "step": 27835 + }, + { + "epoch": 2.72, + "learning_rate": 1.9348463880431776e-05, + "loss": 0.1372, + "step": 27840 + }, + { + "epoch": 2.72, + "learning_rate": 1.9344312205923057e-05, + "loss": 0.1186, + "step": 27845 + }, + { + "epoch": 2.72, + "learning_rate": 1.9340160531414338e-05, + "loss": 0.1057, + "step": 27850 + }, + { + "epoch": 2.72, + "learning_rate": 1.933600885690562e-05, + "loss": 0.1356, + "step": 27855 + }, + { + "epoch": 2.72, + "learning_rate": 1.93318571823969e-05, + "loss": 0.1204, + "step": 27860 + }, + { + "epoch": 2.72, + "learning_rate": 1.9327705507888184e-05, + "loss": 0.1179, + "step": 27865 + }, + { + "epoch": 2.73, + "learning_rate": 1.9323553833379464e-05, + "loss": 0.1147, + "step": 27870 + }, + { + "epoch": 2.73, + "learning_rate": 1.9319402158870745e-05, + "loss": 0.1334, + "step": 27875 + }, + { + "epoch": 2.73, + "learning_rate": 1.9315250484362026e-05, + "loss": 0.112, + "step": 27880 + }, + { + "epoch": 2.73, + "learning_rate": 1.9311098809853307e-05, + "loss": 0.1079, + "step": 27885 + }, + { + "epoch": 2.73, + "learning_rate": 1.9306947135344588e-05, + "loss": 0.1249, + "step": 27890 + }, + { + "epoch": 2.73, + "learning_rate": 1.9302795460835872e-05, + "loss": 0.1064, + "step": 27895 + }, + { + "epoch": 2.73, + "learning_rate": 1.9298643786327152e-05, + "loss": 0.1042, + "step": 27900 + }, + { + "epoch": 2.73, + "learning_rate": 1.9294492111818433e-05, + "loss": 0.1336, + "step": 27905 + }, + { + "epoch": 2.73, + "learning_rate": 1.9290340437309717e-05, + "loss": 0.1139, + "step": 27910 + }, + { + "epoch": 2.73, + "learning_rate": 1.9286188762800998e-05, + "loss": 0.1087, + "step": 27915 + }, + { + "epoch": 2.73, + "learning_rate": 1.928203708829228e-05, + "loss": 0.1072, + "step": 27920 + }, + { + "epoch": 2.73, + "learning_rate": 1.927788541378356e-05, + "loss": 0.1408, + "step": 27925 + }, + { + "epoch": 2.73, + "learning_rate": 1.927373373927484e-05, + "loss": 0.1075, + "step": 27930 + }, + { + "epoch": 2.73, + "learning_rate": 1.926958206476612e-05, + "loss": 0.1094, + "step": 27935 + }, + { + "epoch": 2.73, + "learning_rate": 1.9265430390257402e-05, + "loss": 0.1492, + "step": 27940 + }, + { + "epoch": 2.73, + "learning_rate": 1.9261278715748686e-05, + "loss": 0.1064, + "step": 27945 + }, + { + "epoch": 2.73, + "learning_rate": 1.9257127041239967e-05, + "loss": 0.1207, + "step": 27950 + }, + { + "epoch": 2.73, + "learning_rate": 1.925297536673125e-05, + "loss": 0.1416, + "step": 27955 + }, + { + "epoch": 2.73, + "learning_rate": 1.9248823692222532e-05, + "loss": 0.1294, + "step": 27960 + }, + { + "epoch": 2.73, + "learning_rate": 1.9244672017713813e-05, + "loss": 0.0998, + "step": 27965 + }, + { + "epoch": 2.74, + "learning_rate": 1.9240520343205093e-05, + "loss": 0.1186, + "step": 27970 + }, + { + "epoch": 2.74, + "learning_rate": 1.9236368668696374e-05, + "loss": 0.139, + "step": 27975 + }, + { + "epoch": 2.74, + "learning_rate": 1.9232216994187655e-05, + "loss": 0.1122, + "step": 27980 + }, + { + "epoch": 2.74, + "learning_rate": 1.9228065319678936e-05, + "loss": 0.1111, + "step": 27985 + }, + { + "epoch": 2.74, + "learning_rate": 1.9223913645170216e-05, + "loss": 0.1408, + "step": 27990 + }, + { + "epoch": 2.74, + "learning_rate": 1.92197619706615e-05, + "loss": 0.1042, + "step": 27995 + }, + { + "epoch": 2.74, + "learning_rate": 1.9215610296152785e-05, + "loss": 0.1112, + "step": 28000 + }, + { + "epoch": 2.74, + "eval_cer": 0.059457165914015044, + "eval_loss": 0.2433786690235138, + "eval_runtime": 272.8944, + "eval_samples_per_second": 59.987, + "eval_steps_per_second": 1.667, + "eval_wer": 0.15164258242296416, + "step": 28000 + }, + { + "epoch": 2.74, + "learning_rate": 1.9211458621644066e-05, + "loss": 0.133, + "step": 28005 + }, + { + "epoch": 2.74, + "learning_rate": 1.9207306947135346e-05, + "loss": 0.113, + "step": 28010 + }, + { + "epoch": 2.74, + "learning_rate": 1.9203155272626627e-05, + "loss": 0.0921, + "step": 28015 + }, + { + "epoch": 2.74, + "learning_rate": 1.9199003598117908e-05, + "loss": 0.1297, + "step": 28020 + }, + { + "epoch": 2.74, + "learning_rate": 1.919485192360919e-05, + "loss": 0.1336, + "step": 28025 + }, + { + "epoch": 2.74, + "learning_rate": 1.919070024910047e-05, + "loss": 0.1079, + "step": 28030 + }, + { + "epoch": 2.74, + "learning_rate": 1.918654857459175e-05, + "loss": 0.1287, + "step": 28035 + }, + { + "epoch": 2.74, + "learning_rate": 1.918239690008303e-05, + "loss": 0.1325, + "step": 28040 + }, + { + "epoch": 2.74, + "learning_rate": 1.917824522557432e-05, + "loss": 0.1349, + "step": 28045 + }, + { + "epoch": 2.74, + "learning_rate": 1.91740935510656e-05, + "loss": 0.1111, + "step": 28050 + }, + { + "epoch": 2.74, + "learning_rate": 1.916994187655688e-05, + "loss": 0.1397, + "step": 28055 + }, + { + "epoch": 2.74, + "learning_rate": 1.916579020204816e-05, + "loss": 0.1143, + "step": 28060 + }, + { + "epoch": 2.74, + "learning_rate": 1.916163852753944e-05, + "loss": 0.1073, + "step": 28065 + }, + { + "epoch": 2.74, + "learning_rate": 1.9157486853030722e-05, + "loss": 0.1164, + "step": 28070 + }, + { + "epoch": 2.75, + "learning_rate": 1.9153335178522003e-05, + "loss": 0.1362, + "step": 28075 + }, + { + "epoch": 2.75, + "learning_rate": 1.9149183504013284e-05, + "loss": 0.1248, + "step": 28080 + }, + { + "epoch": 2.75, + "learning_rate": 1.9145031829504568e-05, + "loss": 0.1237, + "step": 28085 + }, + { + "epoch": 2.75, + "learning_rate": 1.914088015499585e-05, + "loss": 0.1283, + "step": 28090 + }, + { + "epoch": 2.75, + "learning_rate": 1.913672848048713e-05, + "loss": 0.1223, + "step": 28095 + }, + { + "epoch": 2.75, + "learning_rate": 1.9132576805978414e-05, + "loss": 0.1146, + "step": 28100 + }, + { + "epoch": 2.75, + "learning_rate": 1.9128425131469694e-05, + "loss": 0.141, + "step": 28105 + }, + { + "epoch": 2.75, + "learning_rate": 1.9124273456960975e-05, + "loss": 0.1285, + "step": 28110 + }, + { + "epoch": 2.75, + "learning_rate": 1.9120121782452256e-05, + "loss": 0.1136, + "step": 28115 + }, + { + "epoch": 2.75, + "learning_rate": 1.9115970107943537e-05, + "loss": 0.1265, + "step": 28120 + }, + { + "epoch": 2.75, + "learning_rate": 1.9111818433434818e-05, + "loss": 0.1446, + "step": 28125 + }, + { + "epoch": 2.75, + "learning_rate": 1.9107666758926102e-05, + "loss": 0.1, + "step": 28130 + }, + { + "epoch": 2.75, + "learning_rate": 1.9103515084417382e-05, + "loss": 0.123, + "step": 28135 + }, + { + "epoch": 2.75, + "learning_rate": 1.9099363409908663e-05, + "loss": 0.1393, + "step": 28140 + }, + { + "epoch": 2.75, + "learning_rate": 1.9095211735399944e-05, + "loss": 0.12, + "step": 28145 + }, + { + "epoch": 2.75, + "learning_rate": 1.9091060060891228e-05, + "loss": 0.1141, + "step": 28150 + }, + { + "epoch": 2.75, + "learning_rate": 1.908690838638251e-05, + "loss": 0.1341, + "step": 28155 + }, + { + "epoch": 2.75, + "learning_rate": 1.908275671187379e-05, + "loss": 0.131, + "step": 28160 + }, + { + "epoch": 2.75, + "learning_rate": 1.907860503736507e-05, + "loss": 0.1053, + "step": 28165 + }, + { + "epoch": 2.75, + "learning_rate": 1.907445336285635e-05, + "loss": 0.1508, + "step": 28170 + }, + { + "epoch": 2.76, + "learning_rate": 1.9070301688347635e-05, + "loss": 0.1272, + "step": 28175 + }, + { + "epoch": 2.76, + "learning_rate": 1.9066150013838916e-05, + "loss": 0.1278, + "step": 28180 + }, + { + "epoch": 2.76, + "learning_rate": 1.9061998339330197e-05, + "loss": 0.1176, + "step": 28185 + }, + { + "epoch": 2.76, + "learning_rate": 1.9057846664821478e-05, + "loss": 0.1495, + "step": 28190 + }, + { + "epoch": 2.76, + "learning_rate": 1.905369499031276e-05, + "loss": 0.1156, + "step": 28195 + }, + { + "epoch": 2.76, + "learning_rate": 1.9049543315804043e-05, + "loss": 0.114, + "step": 28200 + }, + { + "epoch": 2.76, + "learning_rate": 1.9045391641295323e-05, + "loss": 0.1279, + "step": 28205 + }, + { + "epoch": 2.76, + "learning_rate": 1.9041239966786604e-05, + "loss": 0.1421, + "step": 28210 + }, + { + "epoch": 2.76, + "learning_rate": 1.9037088292277885e-05, + "loss": 0.1148, + "step": 28215 + }, + { + "epoch": 2.76, + "learning_rate": 1.903293661776917e-05, + "loss": 0.115, + "step": 28220 + }, + { + "epoch": 2.76, + "learning_rate": 1.902878494326045e-05, + "loss": 0.1501, + "step": 28225 + }, + { + "epoch": 2.76, + "learning_rate": 1.902463326875173e-05, + "loss": 0.1159, + "step": 28230 + }, + { + "epoch": 2.76, + "learning_rate": 1.902048159424301e-05, + "loss": 0.1074, + "step": 28235 + }, + { + "epoch": 2.76, + "learning_rate": 1.9016329919734292e-05, + "loss": 0.1348, + "step": 28240 + }, + { + "epoch": 2.76, + "learning_rate": 1.9012178245225573e-05, + "loss": 0.1204, + "step": 28245 + }, + { + "epoch": 2.76, + "learning_rate": 1.9008026570716857e-05, + "loss": 0.1039, + "step": 28250 + }, + { + "epoch": 2.76, + "learning_rate": 1.9003874896208138e-05, + "loss": 0.1393, + "step": 28255 + }, + { + "epoch": 2.76, + "learning_rate": 1.899972322169942e-05, + "loss": 0.139, + "step": 28260 + }, + { + "epoch": 2.76, + "learning_rate": 1.8995571547190703e-05, + "loss": 0.1005, + "step": 28265 + }, + { + "epoch": 2.76, + "learning_rate": 1.8991419872681984e-05, + "loss": 0.1393, + "step": 28270 + }, + { + "epoch": 2.76, + "learning_rate": 1.8987268198173264e-05, + "loss": 0.1301, + "step": 28275 + }, + { + "epoch": 2.77, + "learning_rate": 1.8983116523664545e-05, + "loss": 0.1195, + "step": 28280 + }, + { + "epoch": 2.77, + "learning_rate": 1.8978964849155826e-05, + "loss": 0.1152, + "step": 28285 + }, + { + "epoch": 2.77, + "learning_rate": 1.8974813174647107e-05, + "loss": 0.1307, + "step": 28290 + }, + { + "epoch": 2.77, + "learning_rate": 1.8970661500138387e-05, + "loss": 0.1158, + "step": 28295 + }, + { + "epoch": 2.77, + "learning_rate": 1.8966509825629668e-05, + "loss": 0.103, + "step": 28300 + }, + { + "epoch": 2.77, + "learning_rate": 1.8962358151120952e-05, + "loss": 0.1399, + "step": 28305 + }, + { + "epoch": 2.77, + "learning_rate": 1.8958206476612236e-05, + "loss": 0.1284, + "step": 28310 + }, + { + "epoch": 2.77, + "learning_rate": 1.8954054802103517e-05, + "loss": 0.0925, + "step": 28315 + }, + { + "epoch": 2.77, + "learning_rate": 1.8949903127594798e-05, + "loss": 0.1417, + "step": 28320 + }, + { + "epoch": 2.77, + "learning_rate": 1.894575145308608e-05, + "loss": 0.1317, + "step": 28325 + }, + { + "epoch": 2.77, + "learning_rate": 1.894159977857736e-05, + "loss": 0.1186, + "step": 28330 + }, + { + "epoch": 2.77, + "learning_rate": 1.893744810406864e-05, + "loss": 0.123, + "step": 28335 + }, + { + "epoch": 2.77, + "learning_rate": 1.893329642955992e-05, + "loss": 0.1315, + "step": 28340 + }, + { + "epoch": 2.77, + "learning_rate": 1.8929144755051202e-05, + "loss": 0.1207, + "step": 28345 + }, + { + "epoch": 2.77, + "learning_rate": 1.8924993080542486e-05, + "loss": 0.108, + "step": 28350 + }, + { + "epoch": 2.77, + "learning_rate": 1.892084140603377e-05, + "loss": 0.1282, + "step": 28355 + }, + { + "epoch": 2.77, + "learning_rate": 1.891668973152505e-05, + "loss": 0.1221, + "step": 28360 + }, + { + "epoch": 2.77, + "learning_rate": 1.8912538057016332e-05, + "loss": 0.1012, + "step": 28365 + }, + { + "epoch": 2.77, + "learning_rate": 1.8908386382507612e-05, + "loss": 0.1315, + "step": 28370 + }, + { + "epoch": 2.77, + "learning_rate": 1.8904234707998893e-05, + "loss": 0.1245, + "step": 28375 + }, + { + "epoch": 2.78, + "learning_rate": 1.8900083033490174e-05, + "loss": 0.1032, + "step": 28380 + }, + { + "epoch": 2.78, + "learning_rate": 1.8895931358981455e-05, + "loss": 0.119, + "step": 28385 + }, + { + "epoch": 2.78, + "learning_rate": 1.8891779684472736e-05, + "loss": 0.1339, + "step": 28390 + }, + { + "epoch": 2.78, + "learning_rate": 1.888762800996402e-05, + "loss": 0.114, + "step": 28395 + }, + { + "epoch": 2.78, + "learning_rate": 1.88834763354553e-05, + "loss": 0.1132, + "step": 28400 + }, + { + "epoch": 2.78, + "learning_rate": 1.8879324660946585e-05, + "loss": 0.1277, + "step": 28405 + }, + { + "epoch": 2.78, + "learning_rate": 1.8875172986437865e-05, + "loss": 0.1183, + "step": 28410 + }, + { + "epoch": 2.78, + "learning_rate": 1.8871021311929146e-05, + "loss": 0.114, + "step": 28415 + }, + { + "epoch": 2.78, + "learning_rate": 1.8866869637420427e-05, + "loss": 0.1319, + "step": 28420 + }, + { + "epoch": 2.78, + "learning_rate": 1.8862717962911708e-05, + "loss": 0.117, + "step": 28425 + }, + { + "epoch": 2.78, + "learning_rate": 1.885856628840299e-05, + "loss": 0.1049, + "step": 28430 + }, + { + "epoch": 2.78, + "learning_rate": 1.885441461389427e-05, + "loss": 0.1084, + "step": 28435 + }, + { + "epoch": 2.78, + "learning_rate": 1.8850262939385553e-05, + "loss": 0.1422, + "step": 28440 + }, + { + "epoch": 2.78, + "learning_rate": 1.8846111264876834e-05, + "loss": 0.121, + "step": 28445 + }, + { + "epoch": 2.78, + "learning_rate": 1.8841959590368115e-05, + "loss": 0.1161, + "step": 28450 + }, + { + "epoch": 2.78, + "learning_rate": 1.88378079158594e-05, + "loss": 0.1461, + "step": 28455 + }, + { + "epoch": 2.78, + "learning_rate": 1.883365624135068e-05, + "loss": 0.1185, + "step": 28460 + }, + { + "epoch": 2.78, + "learning_rate": 1.882950456684196e-05, + "loss": 0.108, + "step": 28465 + }, + { + "epoch": 2.78, + "learning_rate": 1.882535289233324e-05, + "loss": 0.1201, + "step": 28470 + }, + { + "epoch": 2.78, + "learning_rate": 1.8821201217824522e-05, + "loss": 0.1377, + "step": 28475 + }, + { + "epoch": 2.78, + "learning_rate": 1.8817049543315803e-05, + "loss": 0.0965, + "step": 28480 + }, + { + "epoch": 2.79, + "learning_rate": 1.8812897868807087e-05, + "loss": 0.1105, + "step": 28485 + }, + { + "epoch": 2.79, + "learning_rate": 1.8808746194298368e-05, + "loss": 0.1337, + "step": 28490 + }, + { + "epoch": 2.79, + "learning_rate": 1.880459451978965e-05, + "loss": 0.1099, + "step": 28495 + }, + { + "epoch": 2.79, + "learning_rate": 1.880044284528093e-05, + "loss": 0.1097, + "step": 28500 + }, + { + "epoch": 2.79, + "eval_cer": 0.060468794439395936, + "eval_loss": 0.24666650593280792, + "eval_runtime": 276.041, + "eval_samples_per_second": 59.303, + "eval_steps_per_second": 1.648, + "eval_wer": 0.1550250419542519, + "step": 28500 + }, + { + "epoch": 2.79, + "learning_rate": 1.879629117077221e-05, + "loss": 0.1522, + "step": 28505 + }, + { + "epoch": 2.79, + "learning_rate": 1.8792139496263494e-05, + "loss": 0.1135, + "step": 28510 + }, + { + "epoch": 2.79, + "learning_rate": 1.8787987821754775e-05, + "loss": 0.109, + "step": 28515 + }, + { + "epoch": 2.79, + "learning_rate": 1.8783836147246056e-05, + "loss": 0.1192, + "step": 28520 + }, + { + "epoch": 2.79, + "learning_rate": 1.8779684472737337e-05, + "loss": 0.1349, + "step": 28525 + }, + { + "epoch": 2.79, + "learning_rate": 1.877553279822862e-05, + "loss": 0.1113, + "step": 28530 + }, + { + "epoch": 2.79, + "learning_rate": 1.87713811237199e-05, + "loss": 0.1112, + "step": 28535 + }, + { + "epoch": 2.79, + "learning_rate": 1.8767229449211182e-05, + "loss": 0.1215, + "step": 28540 + }, + { + "epoch": 2.79, + "learning_rate": 1.8763077774702463e-05, + "loss": 0.1101, + "step": 28545 + }, + { + "epoch": 2.79, + "learning_rate": 1.8758926100193744e-05, + "loss": 0.1119, + "step": 28550 + }, + { + "epoch": 2.79, + "learning_rate": 1.8754774425685025e-05, + "loss": 0.1302, + "step": 28555 + }, + { + "epoch": 2.79, + "learning_rate": 1.875062275117631e-05, + "loss": 0.1204, + "step": 28560 + }, + { + "epoch": 2.79, + "learning_rate": 1.874647107666759e-05, + "loss": 0.1163, + "step": 28565 + }, + { + "epoch": 2.79, + "learning_rate": 1.8742319402158874e-05, + "loss": 0.1155, + "step": 28570 + }, + { + "epoch": 2.79, + "learning_rate": 1.8738167727650154e-05, + "loss": 0.1484, + "step": 28575 + }, + { + "epoch": 2.79, + "learning_rate": 1.8734016053141435e-05, + "loss": 0.1001, + "step": 28580 + }, + { + "epoch": 2.8, + "learning_rate": 1.8729864378632716e-05, + "loss": 0.1323, + "step": 28585 + }, + { + "epoch": 2.8, + "learning_rate": 1.8725712704123997e-05, + "loss": 0.1474, + "step": 28590 + }, + { + "epoch": 2.8, + "learning_rate": 1.8721561029615278e-05, + "loss": 0.1218, + "step": 28595 + }, + { + "epoch": 2.8, + "learning_rate": 1.871740935510656e-05, + "loss": 0.1119, + "step": 28600 + }, + { + "epoch": 2.8, + "learning_rate": 1.871325768059784e-05, + "loss": 0.1383, + "step": 28605 + }, + { + "epoch": 2.8, + "learning_rate": 1.8709106006089123e-05, + "loss": 0.1201, + "step": 28610 + }, + { + "epoch": 2.8, + "learning_rate": 1.8704954331580407e-05, + "loss": 0.0909, + "step": 28615 + }, + { + "epoch": 2.8, + "learning_rate": 1.8700802657071688e-05, + "loss": 0.1293, + "step": 28620 + }, + { + "epoch": 2.8, + "learning_rate": 1.869665098256297e-05, + "loss": 0.1341, + "step": 28625 + }, + { + "epoch": 2.8, + "learning_rate": 1.869249930805425e-05, + "loss": 0.1232, + "step": 28630 + }, + { + "epoch": 2.8, + "learning_rate": 1.868834763354553e-05, + "loss": 0.0994, + "step": 28635 + }, + { + "epoch": 2.8, + "learning_rate": 1.868419595903681e-05, + "loss": 0.1369, + "step": 28640 + }, + { + "epoch": 2.8, + "learning_rate": 1.8680044284528092e-05, + "loss": 0.1104, + "step": 28645 + }, + { + "epoch": 2.8, + "learning_rate": 1.8675892610019373e-05, + "loss": 0.1163, + "step": 28650 + }, + { + "epoch": 2.8, + "learning_rate": 1.8671740935510654e-05, + "loss": 0.1286, + "step": 28655 + }, + { + "epoch": 2.8, + "learning_rate": 1.866758926100194e-05, + "loss": 0.1156, + "step": 28660 + }, + { + "epoch": 2.8, + "learning_rate": 1.8663437586493222e-05, + "loss": 0.1171, + "step": 28665 + }, + { + "epoch": 2.8, + "learning_rate": 1.8660116246886243e-05, + "loss": 0.1175, + "step": 28670 + }, + { + "epoch": 2.8, + "learning_rate": 1.8655964572377524e-05, + "loss": 0.1569, + "step": 28675 + }, + { + "epoch": 2.8, + "learning_rate": 1.8651812897868805e-05, + "loss": 0.1147, + "step": 28680 + }, + { + "epoch": 2.8, + "learning_rate": 1.864766122336009e-05, + "loss": 0.1179, + "step": 28685 + }, + { + "epoch": 2.81, + "learning_rate": 1.8643509548851373e-05, + "loss": 0.1336, + "step": 28690 + }, + { + "epoch": 2.81, + "learning_rate": 1.8639357874342654e-05, + "loss": 0.1072, + "step": 28695 + }, + { + "epoch": 2.81, + "learning_rate": 1.8635206199833934e-05, + "loss": 0.1084, + "step": 28700 + }, + { + "epoch": 2.81, + "learning_rate": 1.8631054525325215e-05, + "loss": 0.1291, + "step": 28705 + }, + { + "epoch": 2.81, + "learning_rate": 1.8626902850816496e-05, + "loss": 0.1183, + "step": 28710 + }, + { + "epoch": 2.81, + "learning_rate": 1.8622751176307777e-05, + "loss": 0.1075, + "step": 28715 + }, + { + "epoch": 2.81, + "learning_rate": 1.8618599501799058e-05, + "loss": 0.1232, + "step": 28720 + }, + { + "epoch": 2.81, + "learning_rate": 1.861444782729034e-05, + "loss": 0.1336, + "step": 28725 + }, + { + "epoch": 2.81, + "learning_rate": 1.8610296152781622e-05, + "loss": 0.1197, + "step": 28730 + }, + { + "epoch": 2.81, + "learning_rate": 1.8606144478272907e-05, + "loss": 0.1151, + "step": 28735 + }, + { + "epoch": 2.81, + "learning_rate": 1.8601992803764187e-05, + "loss": 0.1384, + "step": 28740 + }, + { + "epoch": 2.81, + "learning_rate": 1.8597841129255468e-05, + "loss": 0.1096, + "step": 28745 + }, + { + "epoch": 2.81, + "learning_rate": 1.859368945474675e-05, + "loss": 0.1074, + "step": 28750 + }, + { + "epoch": 2.81, + "learning_rate": 1.858953778023803e-05, + "loss": 0.1519, + "step": 28755 + }, + { + "epoch": 2.81, + "learning_rate": 1.858538610572931e-05, + "loss": 0.1371, + "step": 28760 + }, + { + "epoch": 2.81, + "learning_rate": 1.858123443122059e-05, + "loss": 0.1046, + "step": 28765 + }, + { + "epoch": 2.81, + "learning_rate": 1.8577082756711872e-05, + "loss": 0.1466, + "step": 28770 + }, + { + "epoch": 2.81, + "learning_rate": 1.8572931082203156e-05, + "loss": 0.1398, + "step": 28775 + }, + { + "epoch": 2.81, + "learning_rate": 1.8568779407694437e-05, + "loss": 0.1119, + "step": 28780 + }, + { + "epoch": 2.81, + "learning_rate": 1.856462773318572e-05, + "loss": 0.1049, + "step": 28785 + }, + { + "epoch": 2.82, + "learning_rate": 1.8560476058677002e-05, + "loss": 0.1278, + "step": 28790 + }, + { + "epoch": 2.82, + "learning_rate": 1.8556324384168283e-05, + "loss": 0.1235, + "step": 28795 + }, + { + "epoch": 2.82, + "learning_rate": 1.8552172709659563e-05, + "loss": 0.1076, + "step": 28800 + }, + { + "epoch": 2.82, + "learning_rate": 1.8548021035150844e-05, + "loss": 0.15, + "step": 28805 + }, + { + "epoch": 2.82, + "learning_rate": 1.8543869360642125e-05, + "loss": 0.1225, + "step": 28810 + }, + { + "epoch": 2.82, + "learning_rate": 1.8539717686133406e-05, + "loss": 0.1105, + "step": 28815 + }, + { + "epoch": 2.82, + "learning_rate": 1.853556601162469e-05, + "loss": 0.1239, + "step": 28820 + }, + { + "epoch": 2.82, + "learning_rate": 1.853141433711597e-05, + "loss": 0.1361, + "step": 28825 + }, + { + "epoch": 2.82, + "learning_rate": 1.852726266260725e-05, + "loss": 0.112, + "step": 28830 + }, + { + "epoch": 2.82, + "learning_rate": 1.8523110988098536e-05, + "loss": 0.1114, + "step": 28835 + }, + { + "epoch": 2.82, + "learning_rate": 1.8518959313589816e-05, + "loss": 0.135, + "step": 28840 + }, + { + "epoch": 2.82, + "learning_rate": 1.8514807639081097e-05, + "loss": 0.1179, + "step": 28845 + }, + { + "epoch": 2.82, + "learning_rate": 1.8510655964572378e-05, + "loss": 0.112, + "step": 28850 + }, + { + "epoch": 2.82, + "learning_rate": 1.850650429006366e-05, + "loss": 0.1402, + "step": 28855 + }, + { + "epoch": 2.82, + "learning_rate": 1.850235261555494e-05, + "loss": 0.1322, + "step": 28860 + }, + { + "epoch": 2.82, + "learning_rate": 1.8498200941046224e-05, + "loss": 0.0959, + "step": 28865 + }, + { + "epoch": 2.82, + "learning_rate": 1.8494049266537504e-05, + "loss": 0.1276, + "step": 28870 + }, + { + "epoch": 2.82, + "learning_rate": 1.8489897592028785e-05, + "loss": 0.1438, + "step": 28875 + }, + { + "epoch": 2.82, + "learning_rate": 1.8485745917520066e-05, + "loss": 0.1343, + "step": 28880 + }, + { + "epoch": 2.82, + "learning_rate": 1.8481594243011347e-05, + "loss": 0.0999, + "step": 28885 + }, + { + "epoch": 2.82, + "learning_rate": 1.847744256850263e-05, + "loss": 0.1485, + "step": 28890 + }, + { + "epoch": 2.83, + "learning_rate": 1.847329089399391e-05, + "loss": 0.1113, + "step": 28895 + }, + { + "epoch": 2.83, + "learning_rate": 1.8469139219485192e-05, + "loss": 0.1199, + "step": 28900 + }, + { + "epoch": 2.83, + "learning_rate": 1.8464987544976473e-05, + "loss": 0.1367, + "step": 28905 + }, + { + "epoch": 2.83, + "learning_rate": 1.8460835870467757e-05, + "loss": 0.1102, + "step": 28910 + }, + { + "epoch": 2.83, + "learning_rate": 1.8456684195959038e-05, + "loss": 0.1185, + "step": 28915 + }, + { + "epoch": 2.83, + "learning_rate": 1.845253252145032e-05, + "loss": 0.1101, + "step": 28920 + }, + { + "epoch": 2.83, + "learning_rate": 1.84483808469416e-05, + "loss": 0.1205, + "step": 28925 + }, + { + "epoch": 2.83, + "learning_rate": 1.844422917243288e-05, + "loss": 0.1044, + "step": 28930 + }, + { + "epoch": 2.83, + "learning_rate": 1.844007749792416e-05, + "loss": 0.1173, + "step": 28935 + }, + { + "epoch": 2.83, + "learning_rate": 1.8435925823415445e-05, + "loss": 0.131, + "step": 28940 + }, + { + "epoch": 2.83, + "learning_rate": 1.8431774148906726e-05, + "loss": 0.1197, + "step": 28945 + }, + { + "epoch": 2.83, + "learning_rate": 1.842762247439801e-05, + "loss": 0.1163, + "step": 28950 + }, + { + "epoch": 2.83, + "learning_rate": 1.842347079988929e-05, + "loss": 0.1255, + "step": 28955 + }, + { + "epoch": 2.83, + "learning_rate": 1.8419319125380572e-05, + "loss": 0.1287, + "step": 28960 + }, + { + "epoch": 2.83, + "learning_rate": 1.8415167450871852e-05, + "loss": 0.1169, + "step": 28965 + }, + { + "epoch": 2.83, + "learning_rate": 1.8411015776363133e-05, + "loss": 0.1319, + "step": 28970 + }, + { + "epoch": 2.83, + "learning_rate": 1.8406864101854414e-05, + "loss": 0.1363, + "step": 28975 + }, + { + "epoch": 2.83, + "learning_rate": 1.8402712427345695e-05, + "loss": 0.1025, + "step": 28980 + }, + { + "epoch": 2.83, + "learning_rate": 1.8398560752836976e-05, + "loss": 0.1064, + "step": 28985 + }, + { + "epoch": 2.83, + "learning_rate": 1.839440907832826e-05, + "loss": 0.1438, + "step": 28990 + }, + { + "epoch": 2.84, + "learning_rate": 1.8390257403819544e-05, + "loss": 0.1236, + "step": 28995 + }, + { + "epoch": 2.84, + "learning_rate": 1.8386105729310825e-05, + "loss": 0.1253, + "step": 29000 + }, + { + "epoch": 2.84, + "eval_cer": 0.059995930362960755, + "eval_loss": 0.24278943240642548, + "eval_runtime": 273.6008, + "eval_samples_per_second": 59.832, + "eval_steps_per_second": 1.663, + "eval_wer": 0.15408474432393254, + "step": 29000 + }, + { + "epoch": 2.84, + "learning_rate": 1.8381954054802105e-05, + "loss": 0.1437, + "step": 29005 + }, + { + "epoch": 2.84, + "learning_rate": 1.8377802380293386e-05, + "loss": 0.1164, + "step": 29010 + }, + { + "epoch": 2.84, + "learning_rate": 1.8373650705784667e-05, + "loss": 0.1046, + "step": 29015 + }, + { + "epoch": 2.84, + "learning_rate": 1.8369499031275948e-05, + "loss": 0.1198, + "step": 29020 + }, + { + "epoch": 2.84, + "learning_rate": 1.836534735676723e-05, + "loss": 0.1262, + "step": 29025 + }, + { + "epoch": 2.84, + "learning_rate": 1.836119568225851e-05, + "loss": 0.1172, + "step": 29030 + }, + { + "epoch": 2.84, + "learning_rate": 1.835704400774979e-05, + "loss": 0.1263, + "step": 29035 + }, + { + "epoch": 2.84, + "learning_rate": 1.8352892333241074e-05, + "loss": 0.1433, + "step": 29040 + }, + { + "epoch": 2.84, + "learning_rate": 1.834874065873236e-05, + "loss": 0.1163, + "step": 29045 + }, + { + "epoch": 2.84, + "learning_rate": 1.834458898422364e-05, + "loss": 0.1098, + "step": 29050 + }, + { + "epoch": 2.84, + "learning_rate": 1.834043730971492e-05, + "loss": 0.122, + "step": 29055 + }, + { + "epoch": 2.84, + "learning_rate": 1.83362856352062e-05, + "loss": 0.1233, + "step": 29060 + }, + { + "epoch": 2.84, + "learning_rate": 1.833213396069748e-05, + "loss": 0.1009, + "step": 29065 + }, + { + "epoch": 2.84, + "learning_rate": 1.8327982286188762e-05, + "loss": 0.1187, + "step": 29070 + }, + { + "epoch": 2.84, + "learning_rate": 1.8323830611680043e-05, + "loss": 0.1269, + "step": 29075 + }, + { + "epoch": 2.84, + "learning_rate": 1.8319678937171324e-05, + "loss": 0.1042, + "step": 29080 + }, + { + "epoch": 2.84, + "learning_rate": 1.8315527262662608e-05, + "loss": 0.1181, + "step": 29085 + }, + { + "epoch": 2.84, + "learning_rate": 1.831137558815389e-05, + "loss": 0.1432, + "step": 29090 + }, + { + "epoch": 2.85, + "learning_rate": 1.8307223913645173e-05, + "loss": 0.1148, + "step": 29095 + }, + { + "epoch": 2.85, + "learning_rate": 1.8303072239136454e-05, + "loss": 0.1046, + "step": 29100 + }, + { + "epoch": 2.85, + "learning_rate": 1.8298920564627734e-05, + "loss": 0.1316, + "step": 29105 + }, + { + "epoch": 2.85, + "learning_rate": 1.8294768890119015e-05, + "loss": 0.1223, + "step": 29110 + }, + { + "epoch": 2.85, + "learning_rate": 1.8290617215610296e-05, + "loss": 0.1088, + "step": 29115 + }, + { + "epoch": 2.85, + "learning_rate": 1.8286465541101577e-05, + "loss": 0.1487, + "step": 29120 + }, + { + "epoch": 2.85, + "learning_rate": 1.8282313866592857e-05, + "loss": 0.1251, + "step": 29125 + }, + { + "epoch": 2.85, + "learning_rate": 1.827816219208414e-05, + "loss": 0.1034, + "step": 29130 + }, + { + "epoch": 2.85, + "learning_rate": 1.8274010517575422e-05, + "loss": 0.1063, + "step": 29135 + }, + { + "epoch": 2.85, + "learning_rate": 1.8269858843066703e-05, + "loss": 0.1358, + "step": 29140 + }, + { + "epoch": 2.85, + "learning_rate": 1.8265707168557987e-05, + "loss": 0.118, + "step": 29145 + }, + { + "epoch": 2.85, + "learning_rate": 1.8261555494049268e-05, + "loss": 0.1164, + "step": 29150 + }, + { + "epoch": 2.85, + "learning_rate": 1.825740381954055e-05, + "loss": 0.1206, + "step": 29155 + }, + { + "epoch": 2.85, + "learning_rate": 1.825325214503183e-05, + "loss": 0.125, + "step": 29160 + }, + { + "epoch": 2.85, + "learning_rate": 1.824910047052311e-05, + "loss": 0.1192, + "step": 29165 + }, + { + "epoch": 2.85, + "learning_rate": 1.8244948796014394e-05, + "loss": 0.1139, + "step": 29170 + }, + { + "epoch": 2.85, + "learning_rate": 1.8240797121505675e-05, + "loss": 0.1333, + "step": 29175 + }, + { + "epoch": 2.85, + "learning_rate": 1.8236645446996956e-05, + "loss": 0.1113, + "step": 29180 + }, + { + "epoch": 2.85, + "learning_rate": 1.8232493772488237e-05, + "loss": 0.1143, + "step": 29185 + }, + { + "epoch": 2.85, + "learning_rate": 1.8228342097979518e-05, + "loss": 0.1445, + "step": 29190 + }, + { + "epoch": 2.85, + "learning_rate": 1.82241904234708e-05, + "loss": 0.1176, + "step": 29195 + }, + { + "epoch": 2.86, + "learning_rate": 1.8220038748962082e-05, + "loss": 0.1296, + "step": 29200 + }, + { + "epoch": 2.86, + "learning_rate": 1.8215887074453363e-05, + "loss": 0.1438, + "step": 29205 + }, + { + "epoch": 2.86, + "learning_rate": 1.8211735399944644e-05, + "loss": 0.1322, + "step": 29210 + }, + { + "epoch": 2.86, + "learning_rate": 1.8207583725435928e-05, + "loss": 0.1177, + "step": 29215 + }, + { + "epoch": 2.86, + "learning_rate": 1.820343205092721e-05, + "loss": 0.128, + "step": 29220 + }, + { + "epoch": 2.86, + "learning_rate": 1.819928037641849e-05, + "loss": 0.1484, + "step": 29225 + }, + { + "epoch": 2.86, + "learning_rate": 1.819512870190977e-05, + "loss": 0.1111, + "step": 29230 + }, + { + "epoch": 2.86, + "learning_rate": 1.819097702740105e-05, + "loss": 0.1147, + "step": 29235 + }, + { + "epoch": 2.86, + "learning_rate": 1.8186825352892332e-05, + "loss": 0.1317, + "step": 29240 + }, + { + "epoch": 2.86, + "learning_rate": 1.8182673678383616e-05, + "loss": 0.1055, + "step": 29245 + }, + { + "epoch": 2.86, + "learning_rate": 1.8178522003874897e-05, + "loss": 0.1209, + "step": 29250 + }, + { + "epoch": 2.86, + "learning_rate": 1.8174370329366178e-05, + "loss": 0.1465, + "step": 29255 + }, + { + "epoch": 2.86, + "learning_rate": 1.8170218654857462e-05, + "loss": 0.1298, + "step": 29260 + }, + { + "epoch": 2.86, + "learning_rate": 1.8166066980348743e-05, + "loss": 0.1142, + "step": 29265 + }, + { + "epoch": 2.86, + "learning_rate": 1.8161915305840023e-05, + "loss": 0.1304, + "step": 29270 + }, + { + "epoch": 2.86, + "learning_rate": 1.8157763631331304e-05, + "loss": 0.13, + "step": 29275 + }, + { + "epoch": 2.86, + "learning_rate": 1.8153611956822585e-05, + "loss": 0.1077, + "step": 29280 + }, + { + "epoch": 2.86, + "learning_rate": 1.8149460282313866e-05, + "loss": 0.1099, + "step": 29285 + }, + { + "epoch": 2.86, + "learning_rate": 1.8145308607805146e-05, + "loss": 0.1457, + "step": 29290 + }, + { + "epoch": 2.86, + "learning_rate": 1.8141156933296427e-05, + "loss": 0.1178, + "step": 29295 + }, + { + "epoch": 2.87, + "learning_rate": 1.813700525878771e-05, + "loss": 0.1017, + "step": 29300 + }, + { + "epoch": 2.87, + "learning_rate": 1.8132853584278996e-05, + "loss": 0.1432, + "step": 29305 + }, + { + "epoch": 2.87, + "learning_rate": 1.8128701909770276e-05, + "loss": 0.126, + "step": 29310 + }, + { + "epoch": 2.87, + "learning_rate": 1.8124550235261557e-05, + "loss": 0.1106, + "step": 29315 + }, + { + "epoch": 2.87, + "learning_rate": 1.8120398560752838e-05, + "loss": 0.1213, + "step": 29320 + }, + { + "epoch": 2.87, + "learning_rate": 1.811624688624412e-05, + "loss": 0.1302, + "step": 29325 + }, + { + "epoch": 2.87, + "learning_rate": 1.81120952117354e-05, + "loss": 0.1011, + "step": 29330 + }, + { + "epoch": 2.87, + "learning_rate": 1.810794353722668e-05, + "loss": 0.1304, + "step": 29335 + }, + { + "epoch": 2.87, + "learning_rate": 1.810379186271796e-05, + "loss": 0.1194, + "step": 29340 + }, + { + "epoch": 2.87, + "learning_rate": 1.809964018820924e-05, + "loss": 0.1166, + "step": 29345 + }, + { + "epoch": 2.87, + "learning_rate": 1.809548851370053e-05, + "loss": 0.106, + "step": 29350 + }, + { + "epoch": 2.87, + "learning_rate": 1.809133683919181e-05, + "loss": 0.1175, + "step": 29355 + }, + { + "epoch": 2.87, + "learning_rate": 1.808718516468309e-05, + "loss": 0.1169, + "step": 29360 + }, + { + "epoch": 2.87, + "learning_rate": 1.808303349017437e-05, + "loss": 0.1089, + "step": 29365 + }, + { + "epoch": 2.87, + "learning_rate": 1.8078881815665652e-05, + "loss": 0.1241, + "step": 29370 + }, + { + "epoch": 2.87, + "learning_rate": 1.8074730141156933e-05, + "loss": 0.1402, + "step": 29375 + }, + { + "epoch": 2.87, + "learning_rate": 1.8070578466648214e-05, + "loss": 0.116, + "step": 29380 + }, + { + "epoch": 2.87, + "learning_rate": 1.8066426792139495e-05, + "loss": 0.1144, + "step": 29385 + }, + { + "epoch": 2.87, + "learning_rate": 1.8062275117630775e-05, + "loss": 0.156, + "step": 29390 + }, + { + "epoch": 2.87, + "learning_rate": 1.805812344312206e-05, + "loss": 0.1068, + "step": 29395 + }, + { + "epoch": 2.87, + "learning_rate": 1.8053971768613344e-05, + "loss": 0.1192, + "step": 29400 + }, + { + "epoch": 2.88, + "learning_rate": 1.8049820094104624e-05, + "loss": 0.1228, + "step": 29405 + }, + { + "epoch": 2.88, + "learning_rate": 1.8045668419595905e-05, + "loss": 0.1075, + "step": 29410 + }, + { + "epoch": 2.88, + "learning_rate": 1.8041516745087186e-05, + "loss": 0.1065, + "step": 29415 + }, + { + "epoch": 2.88, + "learning_rate": 1.8037365070578467e-05, + "loss": 0.1129, + "step": 29420 + }, + { + "epoch": 2.88, + "learning_rate": 1.8033213396069748e-05, + "loss": 0.139, + "step": 29425 + }, + { + "epoch": 2.88, + "learning_rate": 1.8029061721561028e-05, + "loss": 0.0984, + "step": 29430 + }, + { + "epoch": 2.88, + "learning_rate": 1.8024910047052312e-05, + "loss": 0.1222, + "step": 29435 + }, + { + "epoch": 2.88, + "learning_rate": 1.8020758372543593e-05, + "loss": 0.1366, + "step": 29440 + }, + { + "epoch": 2.88, + "learning_rate": 1.8016606698034874e-05, + "loss": 0.109, + "step": 29445 + }, + { + "epoch": 2.88, + "learning_rate": 1.8012455023526158e-05, + "loss": 0.1236, + "step": 29450 + }, + { + "epoch": 2.88, + "learning_rate": 1.800830334901744e-05, + "loss": 0.1253, + "step": 29455 + }, + { + "epoch": 2.88, + "learning_rate": 1.800415167450872e-05, + "loss": 0.1073, + "step": 29460 + }, + { + "epoch": 2.88, + "learning_rate": 1.8e-05, + "loss": 0.0905, + "step": 29465 + }, + { + "epoch": 2.88, + "learning_rate": 1.799584832549128e-05, + "loss": 0.1274, + "step": 29470 + }, + { + "epoch": 2.88, + "learning_rate": 1.7991696650982562e-05, + "loss": 0.1263, + "step": 29475 + }, + { + "epoch": 2.88, + "learning_rate": 1.7987544976473846e-05, + "loss": 0.1137, + "step": 29480 + }, + { + "epoch": 2.88, + "learning_rate": 1.7983393301965127e-05, + "loss": 0.1245, + "step": 29485 + }, + { + "epoch": 2.88, + "learning_rate": 1.7979241627456408e-05, + "loss": 0.1634, + "step": 29490 + }, + { + "epoch": 2.88, + "learning_rate": 1.797508995294769e-05, + "loss": 0.1065, + "step": 29495 + }, + { + "epoch": 2.88, + "learning_rate": 1.797093827843897e-05, + "loss": 0.1172, + "step": 29500 + }, + { + "epoch": 2.88, + "eval_cer": 0.059234029564988175, + "eval_loss": 0.2398531287908554, + "eval_runtime": 276.8437, + "eval_samples_per_second": 59.131, + "eval_steps_per_second": 1.644, + "eval_wer": 0.1512965006562494, + "step": 29500 + }, + { + "epoch": 2.89, + "learning_rate": 1.7966786603930253e-05, + "loss": 0.1304, + "step": 29505 + }, + { + "epoch": 2.89, + "learning_rate": 1.7962634929421534e-05, + "loss": 0.1178, + "step": 29510 + }, + { + "epoch": 2.89, + "learning_rate": 1.7958483254912815e-05, + "loss": 0.1077, + "step": 29515 + }, + { + "epoch": 2.89, + "learning_rate": 1.7954331580404096e-05, + "loss": 0.1124, + "step": 29520 + }, + { + "epoch": 2.89, + "learning_rate": 1.795017990589538e-05, + "loss": 0.1275, + "step": 29525 + }, + { + "epoch": 2.89, + "learning_rate": 1.794602823138666e-05, + "loss": 0.117, + "step": 29530 + }, + { + "epoch": 2.89, + "learning_rate": 1.794187655687794e-05, + "loss": 0.1179, + "step": 29535 + }, + { + "epoch": 2.89, + "learning_rate": 1.7937724882369222e-05, + "loss": 0.1249, + "step": 29540 + }, + { + "epoch": 2.89, + "learning_rate": 1.7933573207860503e-05, + "loss": 0.113, + "step": 29545 + }, + { + "epoch": 2.89, + "learning_rate": 1.7929421533351784e-05, + "loss": 0.0963, + "step": 29550 + }, + { + "epoch": 2.89, + "learning_rate": 1.7925269858843068e-05, + "loss": 0.1328, + "step": 29555 + }, + { + "epoch": 2.89, + "learning_rate": 1.792111818433435e-05, + "loss": 0.1077, + "step": 29560 + }, + { + "epoch": 2.89, + "learning_rate": 1.791696650982563e-05, + "loss": 0.1117, + "step": 29565 + }, + { + "epoch": 2.89, + "learning_rate": 1.7912814835316914e-05, + "loss": 0.1389, + "step": 29570 + }, + { + "epoch": 2.89, + "learning_rate": 1.7908663160808194e-05, + "loss": 0.137, + "step": 29575 + }, + { + "epoch": 2.89, + "learning_rate": 1.7904511486299475e-05, + "loss": 0.104, + "step": 29580 + }, + { + "epoch": 2.89, + "learning_rate": 1.7900359811790756e-05, + "loss": 0.1083, + "step": 29585 + }, + { + "epoch": 2.89, + "learning_rate": 1.7896208137282037e-05, + "loss": 0.1596, + "step": 29590 + }, + { + "epoch": 2.89, + "learning_rate": 1.7892056462773317e-05, + "loss": 0.1083, + "step": 29595 + }, + { + "epoch": 2.89, + "learning_rate": 1.7887904788264598e-05, + "loss": 0.1228, + "step": 29600 + }, + { + "epoch": 2.89, + "learning_rate": 1.7883753113755882e-05, + "loss": 0.1391, + "step": 29605 + }, + { + "epoch": 2.9, + "learning_rate": 1.7879601439247163e-05, + "loss": 0.1222, + "step": 29610 + }, + { + "epoch": 2.9, + "learning_rate": 1.7875449764738447e-05, + "loss": 0.1155, + "step": 29615 + }, + { + "epoch": 2.9, + "learning_rate": 1.7871298090229728e-05, + "loss": 0.1357, + "step": 29620 + }, + { + "epoch": 2.9, + "learning_rate": 1.786714641572101e-05, + "loss": 0.1378, + "step": 29625 + }, + { + "epoch": 2.9, + "learning_rate": 1.786299474121229e-05, + "loss": 0.1111, + "step": 29630 + }, + { + "epoch": 2.9, + "learning_rate": 1.785884306670357e-05, + "loss": 0.1061, + "step": 29635 + }, + { + "epoch": 2.9, + "learning_rate": 1.785469139219485e-05, + "loss": 0.1398, + "step": 29640 + }, + { + "epoch": 2.9, + "learning_rate": 1.7850539717686132e-05, + "loss": 0.1113, + "step": 29645 + }, + { + "epoch": 2.9, + "learning_rate": 1.7846388043177413e-05, + "loss": 0.098, + "step": 29650 + }, + { + "epoch": 2.9, + "learning_rate": 1.7842236368668697e-05, + "loss": 0.1283, + "step": 29655 + }, + { + "epoch": 2.9, + "learning_rate": 1.783808469415998e-05, + "loss": 0.1032, + "step": 29660 + }, + { + "epoch": 2.9, + "learning_rate": 1.783393301965126e-05, + "loss": 0.1085, + "step": 29665 + }, + { + "epoch": 2.9, + "learning_rate": 1.7829781345142542e-05, + "loss": 0.1232, + "step": 29670 + }, + { + "epoch": 2.9, + "learning_rate": 1.7825629670633823e-05, + "loss": 0.1287, + "step": 29675 + }, + { + "epoch": 2.9, + "learning_rate": 1.7821477996125104e-05, + "loss": 0.1069, + "step": 29680 + }, + { + "epoch": 2.9, + "learning_rate": 1.7817326321616385e-05, + "loss": 0.1093, + "step": 29685 + }, + { + "epoch": 2.9, + "learning_rate": 1.7813174647107666e-05, + "loss": 0.1444, + "step": 29690 + }, + { + "epoch": 2.9, + "learning_rate": 1.7809022972598946e-05, + "loss": 0.1314, + "step": 29695 + }, + { + "epoch": 2.9, + "learning_rate": 1.780487129809023e-05, + "loss": 0.1177, + "step": 29700 + }, + { + "epoch": 2.9, + "learning_rate": 1.780071962358151e-05, + "loss": 0.111, + "step": 29705 + }, + { + "epoch": 2.91, + "learning_rate": 1.7796567949072795e-05, + "loss": 0.1132, + "step": 29710 + }, + { + "epoch": 2.91, + "learning_rate": 1.7792416274564076e-05, + "loss": 0.1124, + "step": 29715 + }, + { + "epoch": 2.91, + "learning_rate": 1.7788264600055357e-05, + "loss": 0.1313, + "step": 29720 + }, + { + "epoch": 2.91, + "learning_rate": 1.7784112925546638e-05, + "loss": 0.1341, + "step": 29725 + }, + { + "epoch": 2.91, + "learning_rate": 1.777996125103792e-05, + "loss": 0.1055, + "step": 29730 + }, + { + "epoch": 2.91, + "learning_rate": 1.77758095765292e-05, + "loss": 0.109, + "step": 29735 + }, + { + "epoch": 2.91, + "learning_rate": 1.777165790202048e-05, + "loss": 0.1386, + "step": 29740 + }, + { + "epoch": 2.91, + "learning_rate": 1.7767506227511764e-05, + "loss": 0.109, + "step": 29745 + }, + { + "epoch": 2.91, + "learning_rate": 1.7763354553003045e-05, + "loss": 0.1159, + "step": 29750 + }, + { + "epoch": 2.91, + "learning_rate": 1.776003321339607e-05, + "loss": 0.1145, + "step": 29755 + }, + { + "epoch": 2.91, + "learning_rate": 1.775588153888735e-05, + "loss": 0.1102, + "step": 29760 + }, + { + "epoch": 2.91, + "learning_rate": 1.775172986437863e-05, + "loss": 0.1119, + "step": 29765 + }, + { + "epoch": 2.91, + "learning_rate": 1.7747578189869912e-05, + "loss": 0.1153, + "step": 29770 + }, + { + "epoch": 2.91, + "learning_rate": 1.7743426515361196e-05, + "loss": 0.1371, + "step": 29775 + }, + { + "epoch": 2.91, + "learning_rate": 1.773927484085248e-05, + "loss": 0.1162, + "step": 29780 + }, + { + "epoch": 2.91, + "learning_rate": 1.773512316634376e-05, + "loss": 0.1132, + "step": 29785 + }, + { + "epoch": 2.91, + "learning_rate": 1.773097149183504e-05, + "loss": 0.1335, + "step": 29790 + }, + { + "epoch": 2.91, + "learning_rate": 1.7726819817326322e-05, + "loss": 0.1201, + "step": 29795 + }, + { + "epoch": 2.91, + "learning_rate": 1.7722668142817603e-05, + "loss": 0.1188, + "step": 29800 + }, + { + "epoch": 2.91, + "learning_rate": 1.7718516468308884e-05, + "loss": 0.1184, + "step": 29805 + }, + { + "epoch": 2.91, + "learning_rate": 1.7714364793800165e-05, + "loss": 0.1143, + "step": 29810 + }, + { + "epoch": 2.92, + "learning_rate": 1.771021311929145e-05, + "loss": 0.1321, + "step": 29815 + }, + { + "epoch": 2.92, + "learning_rate": 1.770606144478273e-05, + "loss": 0.1036, + "step": 29820 + }, + { + "epoch": 2.92, + "learning_rate": 1.770190977027401e-05, + "loss": 0.147, + "step": 29825 + }, + { + "epoch": 2.92, + "learning_rate": 1.7697758095765295e-05, + "loss": 0.1146, + "step": 29830 + }, + { + "epoch": 2.92, + "learning_rate": 1.7693606421256575e-05, + "loss": 0.1215, + "step": 29835 + }, + { + "epoch": 2.92, + "learning_rate": 1.7689454746747856e-05, + "loss": 0.1509, + "step": 29840 + }, + { + "epoch": 2.92, + "learning_rate": 1.7685303072239137e-05, + "loss": 0.1339, + "step": 29845 + }, + { + "epoch": 2.92, + "learning_rate": 1.7681151397730418e-05, + "loss": 0.1171, + "step": 29850 + }, + { + "epoch": 2.92, + "learning_rate": 1.76769997232217e-05, + "loss": 0.1157, + "step": 29855 + }, + { + "epoch": 2.92, + "learning_rate": 1.7672848048712983e-05, + "loss": 0.112, + "step": 29860 + }, + { + "epoch": 2.92, + "learning_rate": 1.7668696374204263e-05, + "loss": 0.1174, + "step": 29865 + }, + { + "epoch": 2.92, + "learning_rate": 1.7664544699695544e-05, + "loss": 0.1252, + "step": 29870 + }, + { + "epoch": 2.92, + "learning_rate": 1.7660393025186825e-05, + "loss": 0.1214, + "step": 29875 + }, + { + "epoch": 2.92, + "learning_rate": 1.7656241350678106e-05, + "loss": 0.1162, + "step": 29880 + }, + { + "epoch": 2.92, + "learning_rate": 1.765208967616939e-05, + "loss": 0.125, + "step": 29885 + }, + { + "epoch": 2.92, + "learning_rate": 1.764793800166067e-05, + "loss": 0.1272, + "step": 29890 + }, + { + "epoch": 2.92, + "learning_rate": 1.764378632715195e-05, + "loss": 0.1103, + "step": 29895 + }, + { + "epoch": 2.92, + "learning_rate": 1.7639634652643232e-05, + "loss": 0.1041, + "step": 29900 + }, + { + "epoch": 2.92, + "learning_rate": 1.7635482978134516e-05, + "loss": 0.1271, + "step": 29905 + }, + { + "epoch": 2.92, + "learning_rate": 1.7631331303625797e-05, + "loss": 0.119, + "step": 29910 + }, + { + "epoch": 2.93, + "learning_rate": 1.7627179629117078e-05, + "loss": 0.1107, + "step": 29915 + }, + { + "epoch": 2.93, + "learning_rate": 1.762302795460836e-05, + "loss": 0.136, + "step": 29920 + }, + { + "epoch": 2.93, + "learning_rate": 1.761887628009964e-05, + "loss": 0.1187, + "step": 29925 + }, + { + "epoch": 2.93, + "learning_rate": 1.761472460559092e-05, + "loss": 0.105, + "step": 29930 + }, + { + "epoch": 2.93, + "learning_rate": 1.7610572931082204e-05, + "loss": 0.1097, + "step": 29935 + }, + { + "epoch": 2.93, + "learning_rate": 1.7606421256573485e-05, + "loss": 0.1475, + "step": 29940 + }, + { + "epoch": 2.93, + "learning_rate": 1.7602269582064766e-05, + "loss": 0.1221, + "step": 29945 + }, + { + "epoch": 2.93, + "learning_rate": 1.759811790755605e-05, + "loss": 0.1242, + "step": 29950 + }, + { + "epoch": 2.93, + "learning_rate": 1.759396623304733e-05, + "loss": 0.1314, + "step": 29955 + }, + { + "epoch": 2.93, + "learning_rate": 1.758981455853861e-05, + "loss": 0.1115, + "step": 29960 + }, + { + "epoch": 2.93, + "learning_rate": 1.7585662884029892e-05, + "loss": 0.1083, + "step": 29965 + }, + { + "epoch": 2.93, + "learning_rate": 1.7581511209521173e-05, + "loss": 0.1181, + "step": 29970 + }, + { + "epoch": 2.93, + "learning_rate": 1.7577359535012454e-05, + "loss": 0.1271, + "step": 29975 + }, + { + "epoch": 2.93, + "learning_rate": 1.7573207860503735e-05, + "loss": 0.1242, + "step": 29980 + }, + { + "epoch": 2.93, + "learning_rate": 1.756905618599502e-05, + "loss": 0.1041, + "step": 29985 + }, + { + "epoch": 2.93, + "learning_rate": 1.75649045114863e-05, + "loss": 0.1294, + "step": 29990 + }, + { + "epoch": 2.93, + "learning_rate": 1.7560752836977584e-05, + "loss": 0.1144, + "step": 29995 + }, + { + "epoch": 2.93, + "learning_rate": 1.7556601162468864e-05, + "loss": 0.12, + "step": 30000 + }, + { + "epoch": 2.93, + "eval_cer": 0.05892996293393083, + "eval_loss": 0.23929035663604736, + "eval_runtime": 274.2792, + "eval_samples_per_second": 59.684, + "eval_steps_per_second": 1.659, + "eval_wer": 0.15181888822864903, + "step": 30000 + }, + { + "epoch": 2.93, + "learning_rate": 1.7552449487960145e-05, + "loss": 0.1221, + "step": 30005 + }, + { + "epoch": 2.93, + "learning_rate": 1.7548297813451426e-05, + "loss": 0.1121, + "step": 30010 + }, + { + "epoch": 2.93, + "learning_rate": 1.7544146138942707e-05, + "loss": 0.1195, + "step": 30015 + }, + { + "epoch": 2.94, + "learning_rate": 1.7539994464433988e-05, + "loss": 0.1099, + "step": 30020 + }, + { + "epoch": 2.94, + "learning_rate": 1.7535842789925268e-05, + "loss": 0.1168, + "step": 30025 + }, + { + "epoch": 2.94, + "learning_rate": 1.753169111541655e-05, + "loss": 0.1055, + "step": 30030 + }, + { + "epoch": 2.94, + "learning_rate": 1.7527539440907833e-05, + "loss": 0.1003, + "step": 30035 + }, + { + "epoch": 2.94, + "learning_rate": 1.7523387766399117e-05, + "loss": 0.1327, + "step": 30040 + }, + { + "epoch": 2.94, + "learning_rate": 1.7519236091890398e-05, + "loss": 0.0994, + "step": 30045 + }, + { + "epoch": 2.94, + "learning_rate": 1.751508441738168e-05, + "loss": 0.1136, + "step": 30050 + }, + { + "epoch": 2.94, + "learning_rate": 1.751093274287296e-05, + "loss": 0.1414, + "step": 30055 + }, + { + "epoch": 2.94, + "learning_rate": 1.750678106836424e-05, + "loss": 0.1252, + "step": 30060 + }, + { + "epoch": 2.94, + "learning_rate": 1.750262939385552e-05, + "loss": 0.108, + "step": 30065 + }, + { + "epoch": 2.94, + "learning_rate": 1.7498477719346802e-05, + "loss": 0.1155, + "step": 30070 + }, + { + "epoch": 2.94, + "learning_rate": 1.7494326044838083e-05, + "loss": 0.1199, + "step": 30075 + }, + { + "epoch": 2.94, + "learning_rate": 1.7490174370329367e-05, + "loss": 0.127, + "step": 30080 + }, + { + "epoch": 2.94, + "learning_rate": 1.7486022695820648e-05, + "loss": 0.1242, + "step": 30085 + }, + { + "epoch": 2.94, + "learning_rate": 1.7481871021311932e-05, + "loss": 0.1192, + "step": 30090 + }, + { + "epoch": 2.94, + "learning_rate": 1.7477719346803213e-05, + "loss": 0.108, + "step": 30095 + }, + { + "epoch": 2.94, + "learning_rate": 1.7473567672294493e-05, + "loss": 0.1178, + "step": 30100 + }, + { + "epoch": 2.94, + "learning_rate": 1.7469415997785774e-05, + "loss": 0.1331, + "step": 30105 + }, + { + "epoch": 2.94, + "learning_rate": 1.7465264323277055e-05, + "loss": 0.1168, + "step": 30110 + }, + { + "epoch": 2.94, + "learning_rate": 1.7461112648768336e-05, + "loss": 0.0961, + "step": 30115 + }, + { + "epoch": 2.95, + "learning_rate": 1.7456960974259616e-05, + "loss": 0.1329, + "step": 30120 + }, + { + "epoch": 2.95, + "learning_rate": 1.74528092997509e-05, + "loss": 0.1414, + "step": 30125 + }, + { + "epoch": 2.95, + "learning_rate": 1.744865762524218e-05, + "loss": 0.1007, + "step": 30130 + }, + { + "epoch": 2.95, + "learning_rate": 1.7444505950733462e-05, + "loss": 0.1227, + "step": 30135 + }, + { + "epoch": 2.95, + "learning_rate": 1.7440354276224746e-05, + "loss": 0.1374, + "step": 30140 + }, + { + "epoch": 2.95, + "learning_rate": 1.7436202601716027e-05, + "loss": 0.1206, + "step": 30145 + }, + { + "epoch": 2.95, + "learning_rate": 1.7432050927207308e-05, + "loss": 0.0981, + "step": 30150 + }, + { + "epoch": 2.95, + "learning_rate": 1.742789925269859e-05, + "loss": 0.1341, + "step": 30155 + }, + { + "epoch": 2.95, + "learning_rate": 1.742374757818987e-05, + "loss": 0.1161, + "step": 30160 + }, + { + "epoch": 2.95, + "learning_rate": 1.741959590368115e-05, + "loss": 0.1003, + "step": 30165 + }, + { + "epoch": 2.95, + "learning_rate": 1.7415444229172434e-05, + "loss": 0.1063, + "step": 30170 + }, + { + "epoch": 2.95, + "learning_rate": 1.7411292554663715e-05, + "loss": 0.12, + "step": 30175 + }, + { + "epoch": 2.95, + "learning_rate": 1.7407140880154996e-05, + "loss": 0.1114, + "step": 30180 + }, + { + "epoch": 2.95, + "learning_rate": 1.7402989205646277e-05, + "loss": 0.1165, + "step": 30185 + }, + { + "epoch": 2.95, + "learning_rate": 1.739883753113756e-05, + "loss": 0.1518, + "step": 30190 + }, + { + "epoch": 2.95, + "learning_rate": 1.739468585662884e-05, + "loss": 0.1038, + "step": 30195 + }, + { + "epoch": 2.95, + "learning_rate": 1.7390534182120122e-05, + "loss": 0.1119, + "step": 30200 + }, + { + "epoch": 2.95, + "learning_rate": 1.7386382507611403e-05, + "loss": 0.1379, + "step": 30205 + }, + { + "epoch": 2.95, + "learning_rate": 1.7382230833102684e-05, + "loss": 0.1212, + "step": 30210 + }, + { + "epoch": 2.95, + "learning_rate": 1.7378079158593968e-05, + "loss": 0.0987, + "step": 30215 + }, + { + "epoch": 2.96, + "learning_rate": 1.737392748408525e-05, + "loss": 0.1209, + "step": 30220 + }, + { + "epoch": 2.96, + "learning_rate": 1.736977580957653e-05, + "loss": 0.1195, + "step": 30225 + }, + { + "epoch": 2.96, + "learning_rate": 1.736562413506781e-05, + "loss": 0.1067, + "step": 30230 + }, + { + "epoch": 2.96, + "learning_rate": 1.736147246055909e-05, + "loss": 0.1015, + "step": 30235 + }, + { + "epoch": 2.96, + "learning_rate": 1.7357320786050375e-05, + "loss": 0.1407, + "step": 30240 + }, + { + "epoch": 2.96, + "learning_rate": 1.7353169111541656e-05, + "loss": 0.1052, + "step": 30245 + }, + { + "epoch": 2.96, + "learning_rate": 1.7349017437032937e-05, + "loss": 0.1137, + "step": 30250 + }, + { + "epoch": 2.96, + "learning_rate": 1.734486576252422e-05, + "loss": 0.1148, + "step": 30255 + }, + { + "epoch": 2.96, + "learning_rate": 1.73407140880155e-05, + "loss": 0.1138, + "step": 30260 + }, + { + "epoch": 2.96, + "learning_rate": 1.7336562413506782e-05, + "loss": 0.0864, + "step": 30265 + }, + { + "epoch": 2.96, + "learning_rate": 1.7332410738998063e-05, + "loss": 0.1133, + "step": 30270 + }, + { + "epoch": 2.96, + "learning_rate": 1.7328259064489344e-05, + "loss": 0.1362, + "step": 30275 + }, + { + "epoch": 2.96, + "learning_rate": 1.7324107389980625e-05, + "loss": 0.1063, + "step": 30280 + }, + { + "epoch": 2.96, + "learning_rate": 1.7319955715471906e-05, + "loss": 0.1193, + "step": 30285 + }, + { + "epoch": 2.96, + "learning_rate": 1.7315804040963186e-05, + "loss": 0.1315, + "step": 30290 + }, + { + "epoch": 2.96, + "learning_rate": 1.731165236645447e-05, + "loss": 0.1063, + "step": 30295 + }, + { + "epoch": 2.96, + "learning_rate": 1.7307500691945755e-05, + "loss": 0.1172, + "step": 30300 + }, + { + "epoch": 2.96, + "learning_rate": 1.7303349017437035e-05, + "loss": 0.1534, + "step": 30305 + }, + { + "epoch": 2.96, + "learning_rate": 1.7299197342928316e-05, + "loss": 0.1119, + "step": 30310 + }, + { + "epoch": 2.96, + "learning_rate": 1.7295045668419597e-05, + "loss": 0.1038, + "step": 30315 + }, + { + "epoch": 2.96, + "learning_rate": 1.7290893993910878e-05, + "loss": 0.1157, + "step": 30320 + }, + { + "epoch": 2.97, + "learning_rate": 1.728674231940216e-05, + "loss": 0.1302, + "step": 30325 + }, + { + "epoch": 2.97, + "learning_rate": 1.728259064489344e-05, + "loss": 0.1013, + "step": 30330 + }, + { + "epoch": 2.97, + "learning_rate": 1.727843897038472e-05, + "loss": 0.1354, + "step": 30335 + }, + { + "epoch": 2.97, + "learning_rate": 1.7274287295876e-05, + "loss": 0.1434, + "step": 30340 + }, + { + "epoch": 2.97, + "learning_rate": 1.7270135621367288e-05, + "loss": 0.1129, + "step": 30345 + }, + { + "epoch": 2.97, + "learning_rate": 1.726598394685857e-05, + "loss": 0.1108, + "step": 30350 + }, + { + "epoch": 2.97, + "learning_rate": 1.726183227234985e-05, + "loss": 0.1106, + "step": 30355 + }, + { + "epoch": 2.97, + "learning_rate": 1.725768059784113e-05, + "loss": 0.1153, + "step": 30360 + }, + { + "epoch": 2.97, + "learning_rate": 1.725352892333241e-05, + "loss": 0.1122, + "step": 30365 + }, + { + "epoch": 2.97, + "learning_rate": 1.7249377248823692e-05, + "loss": 0.1224, + "step": 30370 + }, + { + "epoch": 2.97, + "learning_rate": 1.7245225574314973e-05, + "loss": 0.1251, + "step": 30375 + }, + { + "epoch": 2.97, + "learning_rate": 1.7241073899806254e-05, + "loss": 0.0997, + "step": 30380 + }, + { + "epoch": 2.97, + "learning_rate": 1.7236922225297534e-05, + "loss": 0.1021, + "step": 30385 + }, + { + "epoch": 2.97, + "learning_rate": 1.723277055078882e-05, + "loss": 0.1332, + "step": 30390 + }, + { + "epoch": 2.97, + "learning_rate": 1.7228618876280103e-05, + "loss": 0.1075, + "step": 30395 + }, + { + "epoch": 2.97, + "learning_rate": 1.7224467201771384e-05, + "loss": 0.1136, + "step": 30400 + }, + { + "epoch": 2.97, + "learning_rate": 1.7220315527262664e-05, + "loss": 0.1309, + "step": 30405 + }, + { + "epoch": 2.97, + "learning_rate": 1.7216163852753945e-05, + "loss": 0.1133, + "step": 30410 + }, + { + "epoch": 2.97, + "learning_rate": 1.7212012178245226e-05, + "loss": 0.1285, + "step": 30415 + }, + { + "epoch": 2.97, + "learning_rate": 1.7207860503736507e-05, + "loss": 0.1101, + "step": 30420 + }, + { + "epoch": 2.98, + "learning_rate": 1.7203708829227787e-05, + "loss": 0.1476, + "step": 30425 + }, + { + "epoch": 2.98, + "learning_rate": 1.7199557154719068e-05, + "loss": 0.0989, + "step": 30430 + }, + { + "epoch": 2.98, + "learning_rate": 1.7195405480210352e-05, + "loss": 0.1031, + "step": 30435 + }, + { + "epoch": 2.98, + "learning_rate": 1.7191253805701633e-05, + "loss": 0.143, + "step": 30440 + }, + { + "epoch": 2.98, + "learning_rate": 1.7187102131192917e-05, + "loss": 0.1079, + "step": 30445 + }, + { + "epoch": 2.98, + "learning_rate": 1.7182950456684198e-05, + "loss": 0.1221, + "step": 30450 + }, + { + "epoch": 2.98, + "learning_rate": 1.717879878217548e-05, + "loss": 0.1181, + "step": 30455 + }, + { + "epoch": 2.98, + "learning_rate": 1.717464710766676e-05, + "loss": 0.1091, + "step": 30460 + }, + { + "epoch": 2.98, + "learning_rate": 1.717049543315804e-05, + "loss": 0.0991, + "step": 30465 + }, + { + "epoch": 2.98, + "learning_rate": 1.716634375864932e-05, + "loss": 0.1076, + "step": 30470 + }, + { + "epoch": 2.98, + "learning_rate": 1.7162192084140605e-05, + "loss": 0.1277, + "step": 30475 + }, + { + "epoch": 2.98, + "learning_rate": 1.7158040409631886e-05, + "loss": 0.1158, + "step": 30480 + }, + { + "epoch": 2.98, + "learning_rate": 1.7153888735123167e-05, + "loss": 0.1188, + "step": 30485 + }, + { + "epoch": 2.98, + "learning_rate": 1.7149737060614448e-05, + "loss": 0.1318, + "step": 30490 + }, + { + "epoch": 2.98, + "learning_rate": 1.7145585386105728e-05, + "loss": 0.1129, + "step": 30495 + }, + { + "epoch": 2.98, + "learning_rate": 1.7141433711597012e-05, + "loss": 0.0976, + "step": 30500 + }, + { + "epoch": 2.98, + "eval_cer": 0.059571624455743856, + "eval_loss": 0.244193896651268, + "eval_runtime": 274.299, + "eval_samples_per_second": 59.679, + "eval_steps_per_second": 1.659, + "eval_wer": 0.15199519403433392, + "step": 30500 + }, + { + "epoch": 2.98, + "learning_rate": 1.7137282037088293e-05, + "loss": 0.1406, + "step": 30505 + }, + { + "epoch": 2.98, + "learning_rate": 1.7133130362579574e-05, + "loss": 0.1229, + "step": 30510 + }, + { + "epoch": 2.98, + "learning_rate": 1.7128978688070855e-05, + "loss": 0.1079, + "step": 30515 + }, + { + "epoch": 2.98, + "learning_rate": 1.712482701356214e-05, + "loss": 0.1146, + "step": 30520 + }, + { + "epoch": 2.98, + "learning_rate": 1.712067533905342e-05, + "loss": 0.1135, + "step": 30525 + }, + { + "epoch": 2.99, + "learning_rate": 1.71165236645447e-05, + "loss": 0.1132, + "step": 30530 + }, + { + "epoch": 2.99, + "learning_rate": 1.711237199003598e-05, + "loss": 0.111, + "step": 30535 + }, + { + "epoch": 2.99, + "learning_rate": 1.7108220315527262e-05, + "loss": 0.1209, + "step": 30540 + }, + { + "epoch": 2.99, + "learning_rate": 1.7104068641018543e-05, + "loss": 0.0941, + "step": 30545 + }, + { + "epoch": 2.99, + "learning_rate": 1.7099916966509827e-05, + "loss": 0.1214, + "step": 30550 + }, + { + "epoch": 2.99, + "learning_rate": 1.7095765292001108e-05, + "loss": 0.1177, + "step": 30555 + }, + { + "epoch": 2.99, + "learning_rate": 1.709161361749239e-05, + "loss": 0.11, + "step": 30560 + }, + { + "epoch": 2.99, + "learning_rate": 1.7087461942983673e-05, + "loss": 0.1063, + "step": 30565 + }, + { + "epoch": 2.99, + "learning_rate": 1.7083310268474953e-05, + "loss": 0.1169, + "step": 30570 + }, + { + "epoch": 2.99, + "learning_rate": 1.7079158593966234e-05, + "loss": 0.1236, + "step": 30575 + }, + { + "epoch": 2.99, + "learning_rate": 1.7075006919457515e-05, + "loss": 0.1153, + "step": 30580 + }, + { + "epoch": 2.99, + "learning_rate": 1.7070855244948796e-05, + "loss": 0.116, + "step": 30585 + }, + { + "epoch": 2.99, + "learning_rate": 1.7066703570440076e-05, + "loss": 0.1377, + "step": 30590 + }, + { + "epoch": 2.99, + "learning_rate": 1.7062551895931357e-05, + "loss": 0.1204, + "step": 30595 + }, + { + "epoch": 2.99, + "learning_rate": 1.705840022142264e-05, + "loss": 0.1032, + "step": 30600 + }, + { + "epoch": 2.99, + "learning_rate": 1.7054248546913922e-05, + "loss": 0.1481, + "step": 30605 + }, + { + "epoch": 2.99, + "learning_rate": 1.7050096872405206e-05, + "loss": 0.1154, + "step": 30610 + }, + { + "epoch": 2.99, + "learning_rate": 1.7045945197896487e-05, + "loss": 0.1217, + "step": 30615 + }, + { + "epoch": 2.99, + "learning_rate": 1.7041793523387768e-05, + "loss": 0.1226, + "step": 30620 + }, + { + "epoch": 2.99, + "learning_rate": 1.703764184887905e-05, + "loss": 0.1231, + "step": 30625 + }, + { + "epoch": 3.0, + "learning_rate": 1.703349017437033e-05, + "loss": 0.1041, + "step": 30630 + }, + { + "epoch": 3.0, + "learning_rate": 1.702933849986161e-05, + "loss": 0.1235, + "step": 30635 + }, + { + "epoch": 3.0, + "learning_rate": 1.702518682535289e-05, + "loss": 0.1393, + "step": 30640 + }, + { + "epoch": 3.0, + "learning_rate": 1.702103515084417e-05, + "loss": 0.1112, + "step": 30645 + }, + { + "epoch": 3.0, + "learning_rate": 1.7016883476335456e-05, + "loss": 0.1122, + "step": 30650 + }, + { + "epoch": 3.0, + "learning_rate": 1.701273180182674e-05, + "loss": 0.1289, + "step": 30655 + }, + { + "epoch": 3.0, + "learning_rate": 1.700858012731802e-05, + "loss": 0.1151, + "step": 30660 + }, + { + "epoch": 3.0, + "learning_rate": 1.70044284528093e-05, + "loss": 0.1085, + "step": 30665 + }, + { + "epoch": 3.0, + "learning_rate": 1.7000276778300582e-05, + "loss": 0.1355, + "step": 30670 + }, + { + "epoch": 3.0, + "learning_rate": 1.6996125103791863e-05, + "loss": 0.1094, + "step": 30675 + }, + { + "epoch": 3.0, + "learning_rate": 1.6991973429283144e-05, + "loss": 0.12, + "step": 30680 + }, + { + "epoch": 3.0, + "learning_rate": 1.6987821754774425e-05, + "loss": 0.1269, + "step": 30685 + }, + { + "epoch": 3.0, + "learning_rate": 1.6983670080265705e-05, + "loss": 0.0999, + "step": 30690 + }, + { + "epoch": 3.0, + "learning_rate": 1.6979518405756986e-05, + "loss": 0.1142, + "step": 30695 + }, + { + "epoch": 3.0, + "learning_rate": 1.697536673124827e-05, + "loss": 0.1214, + "step": 30700 + }, + { + "epoch": 3.0, + "learning_rate": 1.6971215056739554e-05, + "loss": 0.0962, + "step": 30705 + }, + { + "epoch": 3.0, + "learning_rate": 1.6967063382230835e-05, + "loss": 0.124, + "step": 30710 + }, + { + "epoch": 3.0, + "learning_rate": 1.6962911707722116e-05, + "loss": 0.1196, + "step": 30715 + }, + { + "epoch": 3.0, + "learning_rate": 1.6958760033213397e-05, + "loss": 0.1113, + "step": 30720 + }, + { + "epoch": 3.0, + "learning_rate": 1.6954608358704678e-05, + "loss": 0.1007, + "step": 30725 + }, + { + "epoch": 3.0, + "learning_rate": 1.6950456684195958e-05, + "loss": 0.1041, + "step": 30730 + }, + { + "epoch": 3.01, + "learning_rate": 1.694630500968724e-05, + "loss": 0.1096, + "step": 30735 + }, + { + "epoch": 3.01, + "learning_rate": 1.6942153335178523e-05, + "loss": 0.1037, + "step": 30740 + }, + { + "epoch": 3.01, + "learning_rate": 1.6938001660669804e-05, + "loss": 0.0888, + "step": 30745 + }, + { + "epoch": 3.01, + "learning_rate": 1.6933849986161085e-05, + "loss": 0.1069, + "step": 30750 + }, + { + "epoch": 3.01, + "learning_rate": 1.692969831165237e-05, + "loss": 0.1117, + "step": 30755 + }, + { + "epoch": 3.01, + "learning_rate": 1.692554663714365e-05, + "loss": 0.1054, + "step": 30760 + }, + { + "epoch": 3.01, + "learning_rate": 1.692139496263493e-05, + "loss": 0.1517, + "step": 30765 + }, + { + "epoch": 3.01, + "learning_rate": 1.691724328812621e-05, + "loss": 0.1011, + "step": 30770 + }, + { + "epoch": 3.01, + "learning_rate": 1.6913091613617492e-05, + "loss": 0.1018, + "step": 30775 + }, + { + "epoch": 3.01, + "learning_rate": 1.6908939939108773e-05, + "loss": 0.1, + "step": 30780 + }, + { + "epoch": 3.01, + "learning_rate": 1.6904788264600057e-05, + "loss": 0.1183, + "step": 30785 + }, + { + "epoch": 3.01, + "learning_rate": 1.6900636590091338e-05, + "loss": 0.1029, + "step": 30790 + }, + { + "epoch": 3.01, + "learning_rate": 1.689648491558262e-05, + "loss": 0.1074, + "step": 30795 + }, + { + "epoch": 3.01, + "learning_rate": 1.68923332410739e-05, + "loss": 0.1261, + "step": 30800 + }, + { + "epoch": 3.01, + "learning_rate": 1.6888181566565183e-05, + "loss": 0.1095, + "step": 30805 + }, + { + "epoch": 3.01, + "learning_rate": 1.6884029892056464e-05, + "loss": 0.1007, + "step": 30810 + }, + { + "epoch": 3.01, + "learning_rate": 1.6879878217547745e-05, + "loss": 0.1237, + "step": 30815 + }, + { + "epoch": 3.01, + "learning_rate": 1.6875726543039026e-05, + "loss": 0.1158, + "step": 30820 + }, + { + "epoch": 3.01, + "learning_rate": 1.6871574868530306e-05, + "loss": 0.0965, + "step": 30825 + }, + { + "epoch": 3.01, + "learning_rate": 1.686742319402159e-05, + "loss": 0.0951, + "step": 30830 + }, + { + "epoch": 3.02, + "learning_rate": 1.686327151951287e-05, + "loss": 0.1189, + "step": 30835 + }, + { + "epoch": 3.02, + "learning_rate": 1.6859119845004152e-05, + "loss": 0.1051, + "step": 30840 + }, + { + "epoch": 3.02, + "learning_rate": 1.6854968170495433e-05, + "loss": 0.1035, + "step": 30845 + }, + { + "epoch": 3.02, + "learning_rate": 1.6850816495986714e-05, + "loss": 0.1243, + "step": 30850 + }, + { + "epoch": 3.02, + "learning_rate": 1.6846664821477998e-05, + "loss": 0.1106, + "step": 30855 + }, + { + "epoch": 3.02, + "learning_rate": 1.684251314696928e-05, + "loss": 0.0965, + "step": 30860 + }, + { + "epoch": 3.02, + "learning_rate": 1.683836147246056e-05, + "loss": 0.134, + "step": 30865 + }, + { + "epoch": 3.02, + "learning_rate": 1.683420979795184e-05, + "loss": 0.107, + "step": 30870 + }, + { + "epoch": 3.02, + "learning_rate": 1.6830058123443124e-05, + "loss": 0.0918, + "step": 30875 + }, + { + "epoch": 3.02, + "learning_rate": 1.6825906448934405e-05, + "loss": 0.1063, + "step": 30880 + }, + { + "epoch": 3.02, + "learning_rate": 1.6821754774425686e-05, + "loss": 0.1285, + "step": 30885 + }, + { + "epoch": 3.02, + "learning_rate": 1.6817603099916967e-05, + "loss": 0.1013, + "step": 30890 + }, + { + "epoch": 3.02, + "learning_rate": 1.6813451425408247e-05, + "loss": 0.1129, + "step": 30895 + }, + { + "epoch": 3.02, + "learning_rate": 1.6809299750899528e-05, + "loss": 0.1221, + "step": 30900 + }, + { + "epoch": 3.02, + "learning_rate": 1.680514807639081e-05, + "loss": 0.1006, + "step": 30905 + }, + { + "epoch": 3.02, + "learning_rate": 1.6800996401882093e-05, + "loss": 0.0957, + "step": 30910 + }, + { + "epoch": 3.02, + "learning_rate": 1.6796844727373374e-05, + "loss": 0.1189, + "step": 30915 + }, + { + "epoch": 3.02, + "learning_rate": 1.6792693052864658e-05, + "loss": 0.1064, + "step": 30920 + }, + { + "epoch": 3.02, + "learning_rate": 1.678854137835594e-05, + "loss": 0.1084, + "step": 30925 + }, + { + "epoch": 3.02, + "learning_rate": 1.678438970384722e-05, + "loss": 0.1213, + "step": 30930 + }, + { + "epoch": 3.02, + "learning_rate": 1.67802380293385e-05, + "loss": 0.1148, + "step": 30935 + }, + { + "epoch": 3.03, + "learning_rate": 1.677608635482978e-05, + "loss": 0.1038, + "step": 30940 + }, + { + "epoch": 3.03, + "learning_rate": 1.6771934680321062e-05, + "loss": 0.1101, + "step": 30945 + }, + { + "epoch": 3.03, + "learning_rate": 1.6767783005812343e-05, + "loss": 0.1211, + "step": 30950 + }, + { + "epoch": 3.03, + "learning_rate": 1.6763631331303623e-05, + "loss": 0.1096, + "step": 30955 + }, + { + "epoch": 3.03, + "learning_rate": 1.675947965679491e-05, + "loss": 0.0976, + "step": 30960 + }, + { + "epoch": 3.03, + "learning_rate": 1.675532798228619e-05, + "loss": 0.1162, + "step": 30965 + }, + { + "epoch": 3.03, + "learning_rate": 1.6751176307777472e-05, + "loss": 0.1043, + "step": 30970 + }, + { + "epoch": 3.03, + "learning_rate": 1.6747024633268753e-05, + "loss": 0.1138, + "step": 30975 + }, + { + "epoch": 3.03, + "learning_rate": 1.6742872958760034e-05, + "loss": 0.1046, + "step": 30980 + }, + { + "epoch": 3.03, + "learning_rate": 1.6738721284251315e-05, + "loss": 0.124, + "step": 30985 + }, + { + "epoch": 3.03, + "learning_rate": 1.6734569609742595e-05, + "loss": 0.1077, + "step": 30990 + }, + { + "epoch": 3.03, + "learning_rate": 1.6730417935233876e-05, + "loss": 0.1015, + "step": 30995 + }, + { + "epoch": 3.03, + "learning_rate": 1.6726266260725157e-05, + "loss": 0.1422, + "step": 31000 + }, + { + "epoch": 3.03, + "eval_cer": 0.05879931833579593, + "eval_loss": 0.239752858877182, + "eval_runtime": 274.4878, + "eval_samples_per_second": 59.638, + "eval_steps_per_second": 1.658, + "eval_wer": 0.1502647852007601, + "step": 31000 + }, + { + "epoch": 3.03, + "learning_rate": 1.672211458621644e-05, + "loss": 0.1064, + "step": 31005 + }, + { + "epoch": 3.03, + "learning_rate": 1.6717962911707725e-05, + "loss": 0.0944, + "step": 31010 + }, + { + "epoch": 3.03, + "learning_rate": 1.6713811237199006e-05, + "loss": 0.1093, + "step": 31015 + }, + { + "epoch": 3.03, + "learning_rate": 1.6709659562690287e-05, + "loss": 0.1188, + "step": 31020 + }, + { + "epoch": 3.03, + "learning_rate": 1.6705507888181568e-05, + "loss": 0.0959, + "step": 31025 + }, + { + "epoch": 3.03, + "learning_rate": 1.670135621367285e-05, + "loss": 0.1072, + "step": 31030 + }, + { + "epoch": 3.03, + "learning_rate": 1.669720453916413e-05, + "loss": 0.1168, + "step": 31035 + }, + { + "epoch": 3.04, + "learning_rate": 1.669305286465541e-05, + "loss": 0.103, + "step": 31040 + }, + { + "epoch": 3.04, + "learning_rate": 1.668890119014669e-05, + "loss": 0.1056, + "step": 31045 + }, + { + "epoch": 3.04, + "learning_rate": 1.6684749515637975e-05, + "loss": 0.1268, + "step": 31050 + }, + { + "epoch": 3.04, + "learning_rate": 1.6680597841129256e-05, + "loss": 0.1032, + "step": 31055 + }, + { + "epoch": 3.04, + "learning_rate": 1.6676446166620536e-05, + "loss": 0.1115, + "step": 31060 + }, + { + "epoch": 3.04, + "learning_rate": 1.667229449211182e-05, + "loss": 0.1164, + "step": 31065 + }, + { + "epoch": 3.04, + "learning_rate": 1.66681428176031e-05, + "loss": 0.1008, + "step": 31070 + }, + { + "epoch": 3.04, + "learning_rate": 1.6663991143094382e-05, + "loss": 0.109, + "step": 31075 + }, + { + "epoch": 3.04, + "learning_rate": 1.6659839468585663e-05, + "loss": 0.1168, + "step": 31080 + }, + { + "epoch": 3.04, + "learning_rate": 1.6655687794076944e-05, + "loss": 0.1166, + "step": 31085 + }, + { + "epoch": 3.04, + "learning_rate": 1.6651536119568224e-05, + "loss": 0.1051, + "step": 31090 + }, + { + "epoch": 3.04, + "learning_rate": 1.664738444505951e-05, + "loss": 0.104, + "step": 31095 + }, + { + "epoch": 3.04, + "learning_rate": 1.664323277055079e-05, + "loss": 0.1183, + "step": 31100 + }, + { + "epoch": 3.04, + "learning_rate": 1.663908109604207e-05, + "loss": 0.0933, + "step": 31105 + }, + { + "epoch": 3.04, + "learning_rate": 1.663492942153335e-05, + "loss": 0.0979, + "step": 31110 + }, + { + "epoch": 3.04, + "learning_rate": 1.6630777747024635e-05, + "loss": 0.1271, + "step": 31115 + }, + { + "epoch": 3.04, + "learning_rate": 1.6626626072515916e-05, + "loss": 0.1218, + "step": 31120 + }, + { + "epoch": 3.04, + "learning_rate": 1.6622474398007197e-05, + "loss": 0.0973, + "step": 31125 + }, + { + "epoch": 3.04, + "learning_rate": 1.6618322723498477e-05, + "loss": 0.106, + "step": 31130 + }, + { + "epoch": 3.04, + "learning_rate": 1.6614171048989758e-05, + "loss": 0.1162, + "step": 31135 + }, + { + "epoch": 3.04, + "learning_rate": 1.6610019374481042e-05, + "loss": 0.0967, + "step": 31140 + }, + { + "epoch": 3.05, + "learning_rate": 1.6605867699972323e-05, + "loss": 0.095, + "step": 31145 + }, + { + "epoch": 3.05, + "learning_rate": 1.6601716025463604e-05, + "loss": 0.118, + "step": 31150 + }, + { + "epoch": 3.05, + "learning_rate": 1.6597564350954885e-05, + "loss": 0.1101, + "step": 31155 + }, + { + "epoch": 3.05, + "learning_rate": 1.6593412676446165e-05, + "loss": 0.0925, + "step": 31160 + }, + { + "epoch": 3.05, + "learning_rate": 1.658926100193745e-05, + "loss": 0.1327, + "step": 31165 + }, + { + "epoch": 3.05, + "learning_rate": 1.658510932742873e-05, + "loss": 0.1054, + "step": 31170 + }, + { + "epoch": 3.05, + "learning_rate": 1.658095765292001e-05, + "loss": 0.1071, + "step": 31175 + }, + { + "epoch": 3.05, + "learning_rate": 1.6576805978411295e-05, + "loss": 0.1215, + "step": 31180 + }, + { + "epoch": 3.05, + "learning_rate": 1.6572654303902576e-05, + "loss": 0.1239, + "step": 31185 + }, + { + "epoch": 3.05, + "learning_rate": 1.6568502629393857e-05, + "loss": 0.0872, + "step": 31190 + }, + { + "epoch": 3.05, + "learning_rate": 1.6564350954885137e-05, + "loss": 0.0978, + "step": 31195 + }, + { + "epoch": 3.05, + "learning_rate": 1.6560199280376418e-05, + "loss": 0.1177, + "step": 31200 + }, + { + "epoch": 3.05, + "learning_rate": 1.65560476058677e-05, + "loss": 0.096, + "step": 31205 + }, + { + "epoch": 3.05, + "learning_rate": 1.655189593135898e-05, + "loss": 0.0874, + "step": 31210 + }, + { + "epoch": 3.05, + "learning_rate": 1.6547744256850264e-05, + "loss": 0.1057, + "step": 31215 + }, + { + "epoch": 3.05, + "learning_rate": 1.6543592582341545e-05, + "loss": 0.1126, + "step": 31220 + }, + { + "epoch": 3.05, + "learning_rate": 1.653944090783283e-05, + "loss": 0.0945, + "step": 31225 + }, + { + "epoch": 3.05, + "learning_rate": 1.653528923332411e-05, + "loss": 0.0989, + "step": 31230 + }, + { + "epoch": 3.05, + "learning_rate": 1.653113755881539e-05, + "loss": 0.1256, + "step": 31235 + }, + { + "epoch": 3.05, + "learning_rate": 1.652698588430667e-05, + "loss": 0.0986, + "step": 31240 + }, + { + "epoch": 3.06, + "learning_rate": 1.6522834209797952e-05, + "loss": 0.0975, + "step": 31245 + }, + { + "epoch": 3.06, + "learning_rate": 1.6518682535289233e-05, + "loss": 0.1274, + "step": 31250 + }, + { + "epoch": 3.06, + "learning_rate": 1.6514530860780513e-05, + "loss": 0.0972, + "step": 31255 + }, + { + "epoch": 3.06, + "learning_rate": 1.6510379186271794e-05, + "loss": 0.0869, + "step": 31260 + }, + { + "epoch": 3.06, + "learning_rate": 1.650622751176308e-05, + "loss": 0.1136, + "step": 31265 + }, + { + "epoch": 3.06, + "learning_rate": 1.6502075837254363e-05, + "loss": 0.116, + "step": 31270 + }, + { + "epoch": 3.06, + "learning_rate": 1.6497924162745643e-05, + "loss": 0.1043, + "step": 31275 + }, + { + "epoch": 3.06, + "learning_rate": 1.6493772488236924e-05, + "loss": 0.1123, + "step": 31280 + }, + { + "epoch": 3.06, + "learning_rate": 1.6489620813728205e-05, + "loss": 0.1335, + "step": 31285 + }, + { + "epoch": 3.06, + "learning_rate": 1.6485469139219486e-05, + "loss": 0.1158, + "step": 31290 + }, + { + "epoch": 3.06, + "learning_rate": 1.6481317464710766e-05, + "loss": 0.1042, + "step": 31295 + }, + { + "epoch": 3.06, + "learning_rate": 1.6477165790202047e-05, + "loss": 0.1376, + "step": 31300 + }, + { + "epoch": 3.06, + "learning_rate": 1.6473014115693328e-05, + "loss": 0.1095, + "step": 31305 + }, + { + "epoch": 3.06, + "learning_rate": 1.646886244118461e-05, + "loss": 0.1135, + "step": 31310 + }, + { + "epoch": 3.06, + "learning_rate": 1.6464710766675893e-05, + "loss": 0.1196, + "step": 31315 + }, + { + "epoch": 3.06, + "learning_rate": 1.6460559092167177e-05, + "loss": 0.1143, + "step": 31320 + }, + { + "epoch": 3.06, + "learning_rate": 1.6456407417658458e-05, + "loss": 0.0948, + "step": 31325 + }, + { + "epoch": 3.06, + "learning_rate": 1.645225574314974e-05, + "loss": 0.0987, + "step": 31330 + }, + { + "epoch": 3.06, + "learning_rate": 1.644810406864102e-05, + "loss": 0.1223, + "step": 31335 + }, + { + "epoch": 3.06, + "learning_rate": 1.64439523941323e-05, + "loss": 0.1001, + "step": 31340 + }, + { + "epoch": 3.07, + "learning_rate": 1.643980071962358e-05, + "loss": 0.0946, + "step": 31345 + }, + { + "epoch": 3.07, + "learning_rate": 1.643564904511486e-05, + "loss": 0.1264, + "step": 31350 + }, + { + "epoch": 3.07, + "learning_rate": 1.6431497370606142e-05, + "loss": 0.105, + "step": 31355 + }, + { + "epoch": 3.07, + "learning_rate": 1.6427345696097427e-05, + "loss": 0.0953, + "step": 31360 + }, + { + "epoch": 3.07, + "learning_rate": 1.6423194021588707e-05, + "loss": 0.1278, + "step": 31365 + }, + { + "epoch": 3.07, + "learning_rate": 1.641904234707999e-05, + "loss": 0.1131, + "step": 31370 + }, + { + "epoch": 3.07, + "learning_rate": 1.6414890672571272e-05, + "loss": 0.1023, + "step": 31375 + }, + { + "epoch": 3.07, + "learning_rate": 1.6410738998062553e-05, + "loss": 0.1054, + "step": 31380 + }, + { + "epoch": 3.07, + "learning_rate": 1.6406587323553834e-05, + "loss": 0.1404, + "step": 31385 + }, + { + "epoch": 3.07, + "learning_rate": 1.6402435649045115e-05, + "loss": 0.0956, + "step": 31390 + }, + { + "epoch": 3.07, + "learning_rate": 1.6398283974536395e-05, + "loss": 0.0992, + "step": 31395 + }, + { + "epoch": 3.07, + "learning_rate": 1.6394132300027676e-05, + "loss": 0.1213, + "step": 31400 + }, + { + "epoch": 3.07, + "learning_rate": 1.638998062551896e-05, + "loss": 0.0913, + "step": 31405 + }, + { + "epoch": 3.07, + "learning_rate": 1.638582895101024e-05, + "loss": 0.1207, + "step": 31410 + }, + { + "epoch": 3.07, + "learning_rate": 1.6381677276501522e-05, + "loss": 0.1167, + "step": 31415 + }, + { + "epoch": 3.07, + "learning_rate": 1.6377525601992806e-05, + "loss": 0.1071, + "step": 31420 + }, + { + "epoch": 3.07, + "learning_rate": 1.6373373927484087e-05, + "loss": 0.1087, + "step": 31425 + }, + { + "epoch": 3.07, + "learning_rate": 1.6369222252975367e-05, + "loss": 0.1246, + "step": 31430 + }, + { + "epoch": 3.07, + "learning_rate": 1.6365070578466648e-05, + "loss": 0.1106, + "step": 31435 + }, + { + "epoch": 3.07, + "learning_rate": 1.636091890395793e-05, + "loss": 0.0979, + "step": 31440 + }, + { + "epoch": 3.07, + "learning_rate": 1.6356767229449213e-05, + "loss": 0.0939, + "step": 31445 + }, + { + "epoch": 3.08, + "learning_rate": 1.6352615554940494e-05, + "loss": 0.1041, + "step": 31450 + }, + { + "epoch": 3.08, + "learning_rate": 1.6348463880431775e-05, + "loss": 0.1109, + "step": 31455 + }, + { + "epoch": 3.08, + "learning_rate": 1.6344312205923055e-05, + "loss": 0.108, + "step": 31460 + }, + { + "epoch": 3.08, + "learning_rate": 1.6340160531414336e-05, + "loss": 0.1226, + "step": 31465 + }, + { + "epoch": 3.08, + "learning_rate": 1.633600885690562e-05, + "loss": 0.1083, + "step": 31470 + }, + { + "epoch": 3.08, + "learning_rate": 1.63318571823969e-05, + "loss": 0.118, + "step": 31475 + }, + { + "epoch": 3.08, + "learning_rate": 1.6327705507888182e-05, + "loss": 0.1106, + "step": 31480 + }, + { + "epoch": 3.08, + "learning_rate": 1.6323553833379463e-05, + "loss": 0.1203, + "step": 31485 + }, + { + "epoch": 3.08, + "learning_rate": 1.6319402158870747e-05, + "loss": 0.1125, + "step": 31490 + }, + { + "epoch": 3.08, + "learning_rate": 1.6315250484362028e-05, + "loss": 0.0932, + "step": 31495 + }, + { + "epoch": 3.08, + "learning_rate": 1.631109880985331e-05, + "loss": 0.1285, + "step": 31500 + }, + { + "epoch": 3.08, + "eval_cer": 0.05906060753206573, + "eval_loss": 0.24463200569152832, + "eval_runtime": 277.0934, + "eval_samples_per_second": 59.078, + "eval_steps_per_second": 1.642, + "eval_wer": 0.15180582853933905, + "step": 31500 + }, + { + "epoch": 3.08, + "learning_rate": 1.630694713534459e-05, + "loss": 0.1032, + "step": 31505 + }, + { + "epoch": 3.08, + "learning_rate": 1.630279546083587e-05, + "loss": 0.1016, + "step": 31510 + }, + { + "epoch": 3.08, + "learning_rate": 1.629864378632715e-05, + "loss": 0.1305, + "step": 31515 + }, + { + "epoch": 3.08, + "learning_rate": 1.629449211181843e-05, + "loss": 0.1222, + "step": 31520 + }, + { + "epoch": 3.08, + "learning_rate": 1.6290340437309716e-05, + "loss": 0.094, + "step": 31525 + }, + { + "epoch": 3.08, + "learning_rate": 1.6286188762800996e-05, + "loss": 0.1017, + "step": 31530 + }, + { + "epoch": 3.08, + "learning_rate": 1.628203708829228e-05, + "loss": 0.123, + "step": 31535 + }, + { + "epoch": 3.08, + "learning_rate": 1.627788541378356e-05, + "loss": 0.1258, + "step": 31540 + }, + { + "epoch": 3.08, + "learning_rate": 1.6273733739274842e-05, + "loss": 0.1032, + "step": 31545 + }, + { + "epoch": 3.09, + "learning_rate": 1.6269582064766123e-05, + "loss": 0.1232, + "step": 31550 + }, + { + "epoch": 3.09, + "learning_rate": 1.6265430390257404e-05, + "loss": 0.1052, + "step": 31555 + }, + { + "epoch": 3.09, + "learning_rate": 1.6261278715748684e-05, + "loss": 0.1034, + "step": 31560 + }, + { + "epoch": 3.09, + "learning_rate": 1.6257127041239965e-05, + "loss": 0.1483, + "step": 31565 + }, + { + "epoch": 3.09, + "learning_rate": 1.6252975366731246e-05, + "loss": 0.1072, + "step": 31570 + }, + { + "epoch": 3.09, + "learning_rate": 1.624882369222253e-05, + "loss": 0.1113, + "step": 31575 + }, + { + "epoch": 3.09, + "learning_rate": 1.6244672017713814e-05, + "loss": 0.1204, + "step": 31580 + }, + { + "epoch": 3.09, + "learning_rate": 1.6240520343205095e-05, + "loss": 0.127, + "step": 31585 + }, + { + "epoch": 3.09, + "learning_rate": 1.6236368668696376e-05, + "loss": 0.111, + "step": 31590 + }, + { + "epoch": 3.09, + "learning_rate": 1.6232216994187657e-05, + "loss": 0.1089, + "step": 31595 + }, + { + "epoch": 3.09, + "learning_rate": 1.6228065319678937e-05, + "loss": 0.1207, + "step": 31600 + }, + { + "epoch": 3.09, + "learning_rate": 1.6223913645170218e-05, + "loss": 0.1146, + "step": 31605 + }, + { + "epoch": 3.09, + "learning_rate": 1.62197619706615e-05, + "loss": 0.096, + "step": 31610 + }, + { + "epoch": 3.09, + "learning_rate": 1.621561029615278e-05, + "loss": 0.1208, + "step": 31615 + }, + { + "epoch": 3.09, + "learning_rate": 1.621145862164406e-05, + "loss": 0.1136, + "step": 31620 + }, + { + "epoch": 3.09, + "learning_rate": 1.6207306947135348e-05, + "loss": 0.0989, + "step": 31625 + }, + { + "epoch": 3.09, + "learning_rate": 1.620315527262663e-05, + "loss": 0.0985, + "step": 31630 + }, + { + "epoch": 3.09, + "learning_rate": 1.619900359811791e-05, + "loss": 0.121, + "step": 31635 + }, + { + "epoch": 3.09, + "learning_rate": 1.619485192360919e-05, + "loss": 0.1095, + "step": 31640 + }, + { + "epoch": 3.09, + "learning_rate": 1.619070024910047e-05, + "loss": 0.0926, + "step": 31645 + }, + { + "epoch": 3.09, + "learning_rate": 1.6186548574591752e-05, + "loss": 0.1283, + "step": 31650 + }, + { + "epoch": 3.1, + "learning_rate": 1.6182396900083033e-05, + "loss": 0.1034, + "step": 31655 + }, + { + "epoch": 3.1, + "learning_rate": 1.6178245225574313e-05, + "loss": 0.1059, + "step": 31660 + }, + { + "epoch": 3.1, + "learning_rate": 1.6174093551065597e-05, + "loss": 0.114, + "step": 31665 + }, + { + "epoch": 3.1, + "learning_rate": 1.6169941876556878e-05, + "loss": 0.0994, + "step": 31670 + }, + { + "epoch": 3.1, + "learning_rate": 1.616579020204816e-05, + "loss": 0.123, + "step": 31675 + }, + { + "epoch": 3.1, + "learning_rate": 1.6161638527539443e-05, + "loss": 0.1002, + "step": 31680 + }, + { + "epoch": 3.1, + "learning_rate": 1.6157486853030724e-05, + "loss": 0.1137, + "step": 31685 + }, + { + "epoch": 3.1, + "learning_rate": 1.6153335178522005e-05, + "loss": 0.0932, + "step": 31690 + }, + { + "epoch": 3.1, + "learning_rate": 1.6149183504013285e-05, + "loss": 0.0959, + "step": 31695 + }, + { + "epoch": 3.1, + "learning_rate": 1.6145031829504566e-05, + "loss": 0.1227, + "step": 31700 + }, + { + "epoch": 3.1, + "learning_rate": 1.6140880154995847e-05, + "loss": 0.123, + "step": 31705 + }, + { + "epoch": 3.1, + "learning_rate": 1.613672848048713e-05, + "loss": 0.1037, + "step": 31710 + }, + { + "epoch": 3.1, + "learning_rate": 1.6132576805978412e-05, + "loss": 0.1145, + "step": 31715 + }, + { + "epoch": 3.1, + "learning_rate": 1.6128425131469693e-05, + "loss": 0.1001, + "step": 31720 + }, + { + "epoch": 3.1, + "learning_rate": 1.6124273456960973e-05, + "loss": 0.0986, + "step": 31725 + }, + { + "epoch": 3.1, + "learning_rate": 1.6120121782452258e-05, + "loss": 0.0994, + "step": 31730 + }, + { + "epoch": 3.1, + "learning_rate": 1.611597010794354e-05, + "loss": 0.1239, + "step": 31735 + }, + { + "epoch": 3.1, + "learning_rate": 1.611181843343482e-05, + "loss": 0.1039, + "step": 31740 + }, + { + "epoch": 3.1, + "learning_rate": 1.61076667589261e-05, + "loss": 0.1021, + "step": 31745 + }, + { + "epoch": 3.1, + "learning_rate": 1.610351508441738e-05, + "loss": 0.1392, + "step": 31750 + }, + { + "epoch": 3.11, + "learning_rate": 1.6099363409908665e-05, + "loss": 0.1046, + "step": 31755 + }, + { + "epoch": 3.11, + "learning_rate": 1.6095211735399946e-05, + "loss": 0.1012, + "step": 31760 + }, + { + "epoch": 3.11, + "learning_rate": 1.6091060060891226e-05, + "loss": 0.1206, + "step": 31765 + }, + { + "epoch": 3.11, + "learning_rate": 1.6086908386382507e-05, + "loss": 0.1092, + "step": 31770 + }, + { + "epoch": 3.11, + "learning_rate": 1.6082756711873788e-05, + "loss": 0.1016, + "step": 31775 + }, + { + "epoch": 3.11, + "learning_rate": 1.6078605037365072e-05, + "loss": 0.1015, + "step": 31780 + }, + { + "epoch": 3.11, + "learning_rate": 1.6074453362856353e-05, + "loss": 0.1185, + "step": 31785 + }, + { + "epoch": 3.11, + "learning_rate": 1.6070301688347634e-05, + "loss": 0.0929, + "step": 31790 + }, + { + "epoch": 3.11, + "learning_rate": 1.6066150013838914e-05, + "loss": 0.0969, + "step": 31795 + }, + { + "epoch": 3.11, + "learning_rate": 1.60619983393302e-05, + "loss": 0.1368, + "step": 31800 + }, + { + "epoch": 3.11, + "learning_rate": 1.605784666482148e-05, + "loss": 0.1012, + "step": 31805 + }, + { + "epoch": 3.11, + "learning_rate": 1.605369499031276e-05, + "loss": 0.098, + "step": 31810 + }, + { + "epoch": 3.11, + "learning_rate": 1.604954331580404e-05, + "loss": 0.1213, + "step": 31815 + }, + { + "epoch": 3.11, + "learning_rate": 1.604539164129532e-05, + "loss": 0.1114, + "step": 31820 + }, + { + "epoch": 3.11, + "learning_rate": 1.6041239966786602e-05, + "loss": 0.1047, + "step": 31825 + }, + { + "epoch": 3.11, + "learning_rate": 1.6037088292277887e-05, + "loss": 0.1089, + "step": 31830 + }, + { + "epoch": 3.11, + "learning_rate": 1.6032936617769167e-05, + "loss": 0.11, + "step": 31835 + }, + { + "epoch": 3.11, + "learning_rate": 1.6028784943260448e-05, + "loss": 0.1018, + "step": 31840 + }, + { + "epoch": 3.11, + "learning_rate": 1.6024633268751732e-05, + "loss": 0.1078, + "step": 31845 + }, + { + "epoch": 3.11, + "learning_rate": 1.6020481594243013e-05, + "loss": 0.1311, + "step": 31850 + }, + { + "epoch": 3.11, + "learning_rate": 1.6016329919734294e-05, + "loss": 0.1034, + "step": 31855 + }, + { + "epoch": 3.12, + "learning_rate": 1.6012178245225575e-05, + "loss": 0.0991, + "step": 31860 + }, + { + "epoch": 3.12, + "learning_rate": 1.6008026570716855e-05, + "loss": 0.1105, + "step": 31865 + }, + { + "epoch": 3.12, + "learning_rate": 1.6003874896208136e-05, + "loss": 0.0927, + "step": 31870 + }, + { + "epoch": 3.12, + "learning_rate": 1.5999723221699417e-05, + "loss": 0.0943, + "step": 31875 + }, + { + "epoch": 3.12, + "learning_rate": 1.59955715471907e-05, + "loss": 0.099, + "step": 31880 + }, + { + "epoch": 3.12, + "learning_rate": 1.5991419872681985e-05, + "loss": 0.1252, + "step": 31885 + }, + { + "epoch": 3.12, + "learning_rate": 1.5987268198173266e-05, + "loss": 0.1082, + "step": 31890 + }, + { + "epoch": 3.12, + "learning_rate": 1.5983116523664547e-05, + "loss": 0.1061, + "step": 31895 + }, + { + "epoch": 3.12, + "learning_rate": 1.5978964849155827e-05, + "loss": 0.1184, + "step": 31900 + }, + { + "epoch": 3.12, + "learning_rate": 1.5974813174647108e-05, + "loss": 0.1207, + "step": 31905 + }, + { + "epoch": 3.12, + "learning_rate": 1.597066150013839e-05, + "loss": 0.1004, + "step": 31910 + }, + { + "epoch": 3.12, + "learning_rate": 1.596650982562967e-05, + "loss": 0.1125, + "step": 31915 + }, + { + "epoch": 3.12, + "learning_rate": 1.596235815112095e-05, + "loss": 0.1066, + "step": 31920 + }, + { + "epoch": 3.12, + "learning_rate": 1.595820647661223e-05, + "loss": 0.0973, + "step": 31925 + }, + { + "epoch": 3.12, + "learning_rate": 1.5954054802103515e-05, + "loss": 0.113, + "step": 31930 + }, + { + "epoch": 3.12, + "learning_rate": 1.59499031275948e-05, + "loss": 0.1153, + "step": 31935 + }, + { + "epoch": 3.12, + "learning_rate": 1.594575145308608e-05, + "loss": 0.0887, + "step": 31940 + }, + { + "epoch": 3.12, + "learning_rate": 1.594159977857736e-05, + "loss": 0.108, + "step": 31945 + }, + { + "epoch": 3.12, + "learning_rate": 1.5937448104068642e-05, + "loss": 0.123, + "step": 31950 + }, + { + "epoch": 3.12, + "learning_rate": 1.5933296429559923e-05, + "loss": 0.1054, + "step": 31955 + }, + { + "epoch": 3.13, + "learning_rate": 1.5929144755051203e-05, + "loss": 0.1106, + "step": 31960 + }, + { + "epoch": 3.13, + "learning_rate": 1.5924993080542484e-05, + "loss": 0.1255, + "step": 31965 + }, + { + "epoch": 3.13, + "learning_rate": 1.5920841406033765e-05, + "loss": 0.1025, + "step": 31970 + }, + { + "epoch": 3.13, + "learning_rate": 1.591668973152505e-05, + "loss": 0.109, + "step": 31975 + }, + { + "epoch": 3.13, + "learning_rate": 1.591253805701633e-05, + "loss": 0.1225, + "step": 31980 + }, + { + "epoch": 3.13, + "learning_rate": 1.5908386382507614e-05, + "loss": 0.1262, + "step": 31985 + }, + { + "epoch": 3.13, + "learning_rate": 1.5904234707998895e-05, + "loss": 0.1043, + "step": 31990 + }, + { + "epoch": 3.13, + "learning_rate": 1.5900083033490176e-05, + "loss": 0.0945, + "step": 31995 + }, + { + "epoch": 3.13, + "learning_rate": 1.5895931358981456e-05, + "loss": 0.122, + "step": 32000 + }, + { + "epoch": 3.13, + "eval_cer": 0.058660580709457975, + "eval_loss": 0.24014343321323395, + "eval_runtime": 273.9516, + "eval_samples_per_second": 59.755, + "eval_steps_per_second": 1.661, + "eval_wer": 0.15031049411334504, + "step": 32000 + }, + { + "epoch": 3.13, + "learning_rate": 1.5891779684472737e-05, + "loss": 0.1089, + "step": 32005 + }, + { + "epoch": 3.13, + "learning_rate": 1.5887628009964018e-05, + "loss": 0.1023, + "step": 32010 + }, + { + "epoch": 3.13, + "learning_rate": 1.58834763354553e-05, + "loss": 0.1154, + "step": 32015 + }, + { + "epoch": 3.13, + "learning_rate": 1.5879324660946583e-05, + "loss": 0.1111, + "step": 32020 + }, + { + "epoch": 3.13, + "learning_rate": 1.5875172986437864e-05, + "loss": 0.0987, + "step": 32025 + }, + { + "epoch": 3.13, + "learning_rate": 1.5871021311929144e-05, + "loss": 0.117, + "step": 32030 + }, + { + "epoch": 3.13, + "learning_rate": 1.586686963742043e-05, + "loss": 0.1269, + "step": 32035 + }, + { + "epoch": 3.13, + "learning_rate": 1.586271796291171e-05, + "loss": 0.0954, + "step": 32040 + }, + { + "epoch": 3.13, + "learning_rate": 1.585856628840299e-05, + "loss": 0.1168, + "step": 32045 + }, + { + "epoch": 3.13, + "learning_rate": 1.585441461389427e-05, + "loss": 0.1232, + "step": 32050 + }, + { + "epoch": 3.13, + "learning_rate": 1.585026293938555e-05, + "loss": 0.1055, + "step": 32055 + }, + { + "epoch": 3.13, + "learning_rate": 1.5846111264876832e-05, + "loss": 0.0955, + "step": 32060 + }, + { + "epoch": 3.14, + "learning_rate": 1.5841959590368117e-05, + "loss": 0.1205, + "step": 32065 + }, + { + "epoch": 3.14, + "learning_rate": 1.5837807915859397e-05, + "loss": 0.1063, + "step": 32070 + }, + { + "epoch": 3.14, + "learning_rate": 1.5833656241350678e-05, + "loss": 0.0881, + "step": 32075 + }, + { + "epoch": 3.14, + "learning_rate": 1.582950456684196e-05, + "loss": 0.1069, + "step": 32080 + }, + { + "epoch": 3.14, + "learning_rate": 1.5825352892333243e-05, + "loss": 0.1299, + "step": 32085 + }, + { + "epoch": 3.14, + "learning_rate": 1.5821201217824524e-05, + "loss": 0.0979, + "step": 32090 + }, + { + "epoch": 3.14, + "learning_rate": 1.5817049543315805e-05, + "loss": 0.0977, + "step": 32095 + }, + { + "epoch": 3.14, + "learning_rate": 1.5812897868807085e-05, + "loss": 0.1254, + "step": 32100 + }, + { + "epoch": 3.14, + "learning_rate": 1.5808746194298366e-05, + "loss": 0.0897, + "step": 32105 + }, + { + "epoch": 3.14, + "learning_rate": 1.580459451978965e-05, + "loss": 0.1075, + "step": 32110 + }, + { + "epoch": 3.14, + "learning_rate": 1.580044284528093e-05, + "loss": 0.1189, + "step": 32115 + }, + { + "epoch": 3.14, + "learning_rate": 1.5796291170772212e-05, + "loss": 0.1049, + "step": 32120 + }, + { + "epoch": 3.14, + "learning_rate": 1.5792139496263493e-05, + "loss": 0.1141, + "step": 32125 + }, + { + "epoch": 3.14, + "learning_rate": 1.5787987821754773e-05, + "loss": 0.1111, + "step": 32130 + }, + { + "epoch": 3.14, + "learning_rate": 1.5783836147246054e-05, + "loss": 0.1045, + "step": 32135 + }, + { + "epoch": 3.14, + "learning_rate": 1.5779684472737338e-05, + "loss": 0.0953, + "step": 32140 + }, + { + "epoch": 3.14, + "learning_rate": 1.577553279822862e-05, + "loss": 0.1015, + "step": 32145 + }, + { + "epoch": 3.14, + "learning_rate": 1.5771381123719903e-05, + "loss": 0.1132, + "step": 32150 + }, + { + "epoch": 3.14, + "learning_rate": 1.5767229449211184e-05, + "loss": 0.1095, + "step": 32155 + }, + { + "epoch": 3.14, + "learning_rate": 1.5763077774702465e-05, + "loss": 0.1036, + "step": 32160 + }, + { + "epoch": 3.15, + "learning_rate": 1.5758926100193745e-05, + "loss": 0.115, + "step": 32165 + }, + { + "epoch": 3.15, + "learning_rate": 1.5754774425685026e-05, + "loss": 0.1244, + "step": 32170 + }, + { + "epoch": 3.15, + "learning_rate": 1.5750622751176307e-05, + "loss": 0.0971, + "step": 32175 + }, + { + "epoch": 3.15, + "learning_rate": 1.5746471076667588e-05, + "loss": 0.1043, + "step": 32180 + }, + { + "epoch": 3.15, + "learning_rate": 1.574231940215887e-05, + "loss": 0.1362, + "step": 32185 + }, + { + "epoch": 3.15, + "learning_rate": 1.5738167727650153e-05, + "loss": 0.1126, + "step": 32190 + }, + { + "epoch": 3.15, + "learning_rate": 1.5734016053141437e-05, + "loss": 0.0885, + "step": 32195 + }, + { + "epoch": 3.15, + "learning_rate": 1.5729864378632718e-05, + "loss": 0.1544, + "step": 32200 + }, + { + "epoch": 3.15, + "learning_rate": 1.5725712704124e-05, + "loss": 0.0904, + "step": 32205 + }, + { + "epoch": 3.15, + "learning_rate": 1.572156102961528e-05, + "loss": 0.0939, + "step": 32210 + }, + { + "epoch": 3.15, + "learning_rate": 1.571740935510656e-05, + "loss": 0.1179, + "step": 32215 + }, + { + "epoch": 3.15, + "learning_rate": 1.571325768059784e-05, + "loss": 0.1215, + "step": 32220 + }, + { + "epoch": 3.15, + "learning_rate": 1.570910600608912e-05, + "loss": 0.1013, + "step": 32225 + }, + { + "epoch": 3.15, + "learning_rate": 1.5704954331580402e-05, + "loss": 0.1026, + "step": 32230 + }, + { + "epoch": 3.15, + "learning_rate": 1.5700802657071683e-05, + "loss": 0.1263, + "step": 32235 + }, + { + "epoch": 3.15, + "learning_rate": 1.569665098256297e-05, + "loss": 0.0965, + "step": 32240 + }, + { + "epoch": 3.15, + "learning_rate": 1.569249930805425e-05, + "loss": 0.1113, + "step": 32245 + }, + { + "epoch": 3.15, + "learning_rate": 1.5688347633545532e-05, + "loss": 0.1193, + "step": 32250 + }, + { + "epoch": 3.15, + "learning_rate": 1.5684195959036813e-05, + "loss": 0.1032, + "step": 32255 + }, + { + "epoch": 3.15, + "learning_rate": 1.5680044284528094e-05, + "loss": 0.1018, + "step": 32260 + }, + { + "epoch": 3.15, + "learning_rate": 1.5675892610019374e-05, + "loss": 0.116, + "step": 32265 + }, + { + "epoch": 3.16, + "learning_rate": 1.5671740935510655e-05, + "loss": 0.1115, + "step": 32270 + }, + { + "epoch": 3.16, + "learning_rate": 1.5667589261001936e-05, + "loss": 0.1005, + "step": 32275 + }, + { + "epoch": 3.16, + "learning_rate": 1.5663437586493217e-05, + "loss": 0.0988, + "step": 32280 + }, + { + "epoch": 3.16, + "learning_rate": 1.56592859119845e-05, + "loss": 0.1261, + "step": 32285 + }, + { + "epoch": 3.16, + "learning_rate": 1.565513423747578e-05, + "loss": 0.0952, + "step": 32290 + }, + { + "epoch": 3.16, + "learning_rate": 1.5650982562967066e-05, + "loss": 0.0996, + "step": 32295 + }, + { + "epoch": 3.16, + "learning_rate": 1.5646830888458347e-05, + "loss": 0.1171, + "step": 32300 + }, + { + "epoch": 3.16, + "learning_rate": 1.5642679213949627e-05, + "loss": 0.093, + "step": 32305 + }, + { + "epoch": 3.16, + "learning_rate": 1.5638527539440908e-05, + "loss": 0.1064, + "step": 32310 + }, + { + "epoch": 3.16, + "learning_rate": 1.563437586493219e-05, + "loss": 0.1212, + "step": 32315 + }, + { + "epoch": 3.16, + "learning_rate": 1.563022419042347e-05, + "loss": 0.109, + "step": 32320 + }, + { + "epoch": 3.16, + "learning_rate": 1.562607251591475e-05, + "loss": 0.0917, + "step": 32325 + }, + { + "epoch": 3.16, + "learning_rate": 1.5621920841406035e-05, + "loss": 0.098, + "step": 32330 + }, + { + "epoch": 3.16, + "learning_rate": 1.5617769166897315e-05, + "loss": 0.1311, + "step": 32335 + }, + { + "epoch": 3.16, + "learning_rate": 1.5613617492388596e-05, + "loss": 0.1087, + "step": 32340 + }, + { + "epoch": 3.16, + "learning_rate": 1.560946581787988e-05, + "loss": 0.1, + "step": 32345 + }, + { + "epoch": 3.16, + "learning_rate": 1.560531414337116e-05, + "loss": 0.1319, + "step": 32350 + }, + { + "epoch": 3.16, + "learning_rate": 1.5601162468862442e-05, + "loss": 0.0886, + "step": 32355 + }, + { + "epoch": 3.16, + "learning_rate": 1.5597010794353723e-05, + "loss": 0.1002, + "step": 32360 + }, + { + "epoch": 3.16, + "learning_rate": 1.5592859119845003e-05, + "loss": 0.1444, + "step": 32365 + }, + { + "epoch": 3.17, + "learning_rate": 1.5588707445336287e-05, + "loss": 0.114, + "step": 32370 + }, + { + "epoch": 3.17, + "learning_rate": 1.5584555770827568e-05, + "loss": 0.0992, + "step": 32375 + }, + { + "epoch": 3.17, + "learning_rate": 1.558040409631885e-05, + "loss": 0.1072, + "step": 32380 + }, + { + "epoch": 3.17, + "learning_rate": 1.557625242181013e-05, + "loss": 0.1335, + "step": 32385 + }, + { + "epoch": 3.17, + "learning_rate": 1.557210074730141e-05, + "loss": 0.1019, + "step": 32390 + }, + { + "epoch": 3.17, + "learning_rate": 1.5567949072792695e-05, + "loss": 0.0989, + "step": 32395 + }, + { + "epoch": 3.17, + "learning_rate": 1.5563797398283975e-05, + "loss": 0.1349, + "step": 32400 + }, + { + "epoch": 3.17, + "learning_rate": 1.5559645723775256e-05, + "loss": 0.096, + "step": 32405 + }, + { + "epoch": 3.17, + "learning_rate": 1.5555494049266537e-05, + "loss": 0.0941, + "step": 32410 + }, + { + "epoch": 3.17, + "learning_rate": 1.555134237475782e-05, + "loss": 0.1207, + "step": 32415 + }, + { + "epoch": 3.17, + "learning_rate": 1.5547190700249102e-05, + "loss": 0.1114, + "step": 32420 + }, + { + "epoch": 3.17, + "learning_rate": 1.5543039025740383e-05, + "loss": 0.1043, + "step": 32425 + }, + { + "epoch": 3.17, + "learning_rate": 1.5538887351231663e-05, + "loss": 0.0925, + "step": 32430 + }, + { + "epoch": 3.17, + "learning_rate": 1.5534735676722944e-05, + "loss": 0.1211, + "step": 32435 + }, + { + "epoch": 3.17, + "learning_rate": 1.5530584002214225e-05, + "loss": 0.0981, + "step": 32440 + }, + { + "epoch": 3.17, + "learning_rate": 1.552643232770551e-05, + "loss": 0.089, + "step": 32445 + }, + { + "epoch": 3.17, + "learning_rate": 1.552228065319679e-05, + "loss": 0.1232, + "step": 32450 + }, + { + "epoch": 3.17, + "learning_rate": 1.551812897868807e-05, + "loss": 0.112, + "step": 32455 + }, + { + "epoch": 3.17, + "learning_rate": 1.5513977304179355e-05, + "loss": 0.1069, + "step": 32460 + }, + { + "epoch": 3.17, + "learning_rate": 1.5509825629670636e-05, + "loss": 0.1456, + "step": 32465 + }, + { + "epoch": 3.18, + "learning_rate": 1.5505673955161916e-05, + "loss": 0.1138, + "step": 32470 + }, + { + "epoch": 3.18, + "learning_rate": 1.5501522280653197e-05, + "loss": 0.1004, + "step": 32475 + }, + { + "epoch": 3.18, + "learning_rate": 1.5497370606144478e-05, + "loss": 0.109, + "step": 32480 + }, + { + "epoch": 3.18, + "learning_rate": 1.549321893163576e-05, + "loss": 0.1299, + "step": 32485 + }, + { + "epoch": 3.18, + "learning_rate": 1.548906725712704e-05, + "loss": 0.1052, + "step": 32490 + }, + { + "epoch": 3.18, + "learning_rate": 1.5484915582618324e-05, + "loss": 0.1053, + "step": 32495 + }, + { + "epoch": 3.18, + "learning_rate": 1.5480763908109604e-05, + "loss": 0.1132, + "step": 32500 + }, + { + "epoch": 3.18, + "eval_cer": 0.059133444785893156, + "eval_loss": 0.24367590248584747, + "eval_runtime": 279.5373, + "eval_samples_per_second": 58.561, + "eval_steps_per_second": 1.628, + "eval_wer": 0.1514205677046943, + "step": 32500 + }, + { + "epoch": 3.18, + "learning_rate": 1.547661223360089e-05, + "loss": 0.1046, + "step": 32505 + }, + { + "epoch": 3.18, + "learning_rate": 1.547246055909217e-05, + "loss": 0.0917, + "step": 32510 + }, + { + "epoch": 3.18, + "learning_rate": 1.546830888458345e-05, + "loss": 0.11, + "step": 32515 + }, + { + "epoch": 3.18, + "learning_rate": 1.546415721007473e-05, + "loss": 0.1017, + "step": 32520 + }, + { + "epoch": 3.18, + "learning_rate": 1.546000553556601e-05, + "loss": 0.0961, + "step": 32525 + }, + { + "epoch": 3.18, + "learning_rate": 1.5455853861057292e-05, + "loss": 0.0946, + "step": 32530 + }, + { + "epoch": 3.18, + "learning_rate": 1.5451702186548573e-05, + "loss": 0.1092, + "step": 32535 + }, + { + "epoch": 3.18, + "learning_rate": 1.5447550512039854e-05, + "loss": 0.0987, + "step": 32540 + }, + { + "epoch": 3.18, + "learning_rate": 1.5443398837531135e-05, + "loss": 0.1072, + "step": 32545 + }, + { + "epoch": 3.18, + "learning_rate": 1.5439247163022422e-05, + "loss": 0.1191, + "step": 32550 + }, + { + "epoch": 3.18, + "learning_rate": 1.5435095488513703e-05, + "loss": 0.1042, + "step": 32555 + }, + { + "epoch": 3.18, + "learning_rate": 1.5430943814004984e-05, + "loss": 0.099, + "step": 32560 + }, + { + "epoch": 3.18, + "learning_rate": 1.5426792139496265e-05, + "loss": 0.1055, + "step": 32565 + }, + { + "epoch": 3.18, + "learning_rate": 1.5422640464987545e-05, + "loss": 0.1084, + "step": 32570 + }, + { + "epoch": 3.19, + "learning_rate": 1.5418488790478826e-05, + "loss": 0.1031, + "step": 32575 + }, + { + "epoch": 3.19, + "learning_rate": 1.5414337115970107e-05, + "loss": 0.1059, + "step": 32580 + }, + { + "epoch": 3.19, + "learning_rate": 1.5410185441461388e-05, + "loss": 0.127, + "step": 32585 + }, + { + "epoch": 3.19, + "learning_rate": 1.5406033766952672e-05, + "loss": 0.1098, + "step": 32590 + }, + { + "epoch": 3.19, + "learning_rate": 1.5401882092443953e-05, + "loss": 0.092, + "step": 32595 + }, + { + "epoch": 3.19, + "learning_rate": 1.5397730417935237e-05, + "loss": 0.1276, + "step": 32600 + }, + { + "epoch": 3.19, + "learning_rate": 1.5393578743426517e-05, + "loss": 0.0973, + "step": 32605 + }, + { + "epoch": 3.19, + "learning_rate": 1.5389427068917798e-05, + "loss": 0.1045, + "step": 32610 + }, + { + "epoch": 3.19, + "learning_rate": 1.538527539440908e-05, + "loss": 0.1129, + "step": 32615 + }, + { + "epoch": 3.19, + "learning_rate": 1.538112371990036e-05, + "loss": 0.1012, + "step": 32620 + }, + { + "epoch": 3.19, + "learning_rate": 1.537697204539164e-05, + "loss": 0.1047, + "step": 32625 + }, + { + "epoch": 3.19, + "learning_rate": 1.537282037088292e-05, + "loss": 0.1096, + "step": 32630 + }, + { + "epoch": 3.19, + "learning_rate": 1.5368668696374205e-05, + "loss": 0.1262, + "step": 32635 + }, + { + "epoch": 3.19, + "learning_rate": 1.5364517021865486e-05, + "loss": 0.1054, + "step": 32640 + }, + { + "epoch": 3.19, + "learning_rate": 1.5360365347356767e-05, + "loss": 0.096, + "step": 32645 + }, + { + "epoch": 3.19, + "learning_rate": 1.535621367284805e-05, + "loss": 0.1323, + "step": 32650 + }, + { + "epoch": 3.19, + "learning_rate": 1.5352061998339332e-05, + "loss": 0.1099, + "step": 32655 + }, + { + "epoch": 3.19, + "learning_rate": 1.5347910323830613e-05, + "loss": 0.0824, + "step": 32660 + }, + { + "epoch": 3.19, + "learning_rate": 1.5343758649321893e-05, + "loss": 0.1057, + "step": 32665 + }, + { + "epoch": 3.19, + "learning_rate": 1.5339606974813174e-05, + "loss": 0.1215, + "step": 32670 + }, + { + "epoch": 3.2, + "learning_rate": 1.5335455300304455e-05, + "loss": 0.1031, + "step": 32675 + }, + { + "epoch": 3.2, + "learning_rate": 1.533130362579574e-05, + "loss": 0.1148, + "step": 32680 + }, + { + "epoch": 3.2, + "learning_rate": 1.532715195128702e-05, + "loss": 0.1124, + "step": 32685 + }, + { + "epoch": 3.2, + "learning_rate": 1.53230002767783e-05, + "loss": 0.1009, + "step": 32690 + }, + { + "epoch": 3.2, + "learning_rate": 1.531884860226958e-05, + "loss": 0.0963, + "step": 32695 + }, + { + "epoch": 3.2, + "learning_rate": 1.5314696927760866e-05, + "loss": 0.1228, + "step": 32700 + }, + { + "epoch": 3.2, + "learning_rate": 1.5310545253252146e-05, + "loss": 0.1046, + "step": 32705 + }, + { + "epoch": 3.2, + "learning_rate": 1.5306393578743427e-05, + "loss": 0.1028, + "step": 32710 + }, + { + "epoch": 3.2, + "learning_rate": 1.5302241904234708e-05, + "loss": 0.1189, + "step": 32715 + }, + { + "epoch": 3.2, + "learning_rate": 1.529809022972599e-05, + "loss": 0.1009, + "step": 32720 + }, + { + "epoch": 3.2, + "learning_rate": 1.5293938555217273e-05, + "loss": 0.1249, + "step": 32725 + }, + { + "epoch": 3.2, + "learning_rate": 1.5289786880708554e-05, + "loss": 0.1247, + "step": 32730 + }, + { + "epoch": 3.2, + "learning_rate": 1.5285635206199834e-05, + "loss": 0.128, + "step": 32735 + }, + { + "epoch": 3.2, + "learning_rate": 1.5281483531691115e-05, + "loss": 0.1065, + "step": 32740 + }, + { + "epoch": 3.2, + "learning_rate": 1.5277331857182396e-05, + "loss": 0.1078, + "step": 32745 + }, + { + "epoch": 3.2, + "learning_rate": 1.5273180182673677e-05, + "loss": 0.1119, + "step": 32750 + }, + { + "epoch": 3.2, + "learning_rate": 1.526902850816496e-05, + "loss": 0.1061, + "step": 32755 + }, + { + "epoch": 3.2, + "learning_rate": 1.526487683365624e-05, + "loss": 0.1001, + "step": 32760 + }, + { + "epoch": 3.2, + "learning_rate": 1.5260725159147522e-05, + "loss": 0.1042, + "step": 32765 + }, + { + "epoch": 3.2, + "learning_rate": 1.5256573484638807e-05, + "loss": 0.1153, + "step": 32770 + }, + { + "epoch": 3.2, + "learning_rate": 1.5252421810130087e-05, + "loss": 0.1088, + "step": 32775 + }, + { + "epoch": 3.21, + "learning_rate": 1.5248270135621368e-05, + "loss": 0.11, + "step": 32780 + }, + { + "epoch": 3.21, + "learning_rate": 1.5244118461112649e-05, + "loss": 0.1308, + "step": 32785 + }, + { + "epoch": 3.21, + "learning_rate": 1.5239966786603931e-05, + "loss": 0.087, + "step": 32790 + }, + { + "epoch": 3.21, + "learning_rate": 1.5235815112095212e-05, + "loss": 0.0994, + "step": 32795 + }, + { + "epoch": 3.21, + "learning_rate": 1.5231663437586493e-05, + "loss": 0.1138, + "step": 32800 + }, + { + "epoch": 3.21, + "learning_rate": 1.5227511763077774e-05, + "loss": 0.0993, + "step": 32805 + }, + { + "epoch": 3.21, + "learning_rate": 1.5223360088569054e-05, + "loss": 0.0918, + "step": 32810 + }, + { + "epoch": 3.21, + "learning_rate": 1.5219208414060339e-05, + "loss": 0.1252, + "step": 32815 + }, + { + "epoch": 3.21, + "learning_rate": 1.5215056739551621e-05, + "loss": 0.1105, + "step": 32820 + }, + { + "epoch": 3.21, + "learning_rate": 1.5210905065042902e-05, + "loss": 0.0886, + "step": 32825 + }, + { + "epoch": 3.21, + "learning_rate": 1.5206753390534183e-05, + "loss": 0.1296, + "step": 32830 + }, + { + "epoch": 3.21, + "learning_rate": 1.5202601716025463e-05, + "loss": 0.1101, + "step": 32835 + }, + { + "epoch": 3.21, + "learning_rate": 1.5198450041516744e-05, + "loss": 0.1047, + "step": 32840 + }, + { + "epoch": 3.21, + "learning_rate": 1.5194298367008027e-05, + "loss": 0.1023, + "step": 32845 + }, + { + "epoch": 3.21, + "learning_rate": 1.5190146692499307e-05, + "loss": 0.1274, + "step": 32850 + }, + { + "epoch": 3.21, + "learning_rate": 1.5185995017990591e-05, + "loss": 0.1015, + "step": 32855 + }, + { + "epoch": 3.21, + "learning_rate": 1.5181843343481872e-05, + "loss": 0.1022, + "step": 32860 + }, + { + "epoch": 3.21, + "learning_rate": 1.5177691668973153e-05, + "loss": 0.1063, + "step": 32865 + }, + { + "epoch": 3.21, + "learning_rate": 1.5173539994464435e-05, + "loss": 0.1137, + "step": 32870 + }, + { + "epoch": 3.21, + "learning_rate": 1.5169388319955716e-05, + "loss": 0.1004, + "step": 32875 + }, + { + "epoch": 3.22, + "learning_rate": 1.5165236645446997e-05, + "loss": 0.1129, + "step": 32880 + }, + { + "epoch": 3.22, + "learning_rate": 1.5161084970938278e-05, + "loss": 0.1174, + "step": 32885 + }, + { + "epoch": 3.22, + "learning_rate": 1.5156933296429559e-05, + "loss": 0.1058, + "step": 32890 + }, + { + "epoch": 3.22, + "learning_rate": 1.5152781621920841e-05, + "loss": 0.1142, + "step": 32895 + }, + { + "epoch": 3.22, + "learning_rate": 1.5148629947412125e-05, + "loss": 0.1186, + "step": 32900 + }, + { + "epoch": 3.22, + "learning_rate": 1.5144478272903406e-05, + "loss": 0.0999, + "step": 32905 + }, + { + "epoch": 3.22, + "learning_rate": 1.5140326598394687e-05, + "loss": 0.1017, + "step": 32910 + }, + { + "epoch": 3.22, + "learning_rate": 1.5136174923885967e-05, + "loss": 0.132, + "step": 32915 + }, + { + "epoch": 3.22, + "learning_rate": 1.513202324937725e-05, + "loss": 0.1005, + "step": 32920 + }, + { + "epoch": 3.22, + "learning_rate": 1.512787157486853e-05, + "loss": 0.0969, + "step": 32925 + }, + { + "epoch": 3.22, + "learning_rate": 1.5123719900359811e-05, + "loss": 0.1314, + "step": 32930 + }, + { + "epoch": 3.22, + "learning_rate": 1.5119568225851092e-05, + "loss": 0.1366, + "step": 32935 + }, + { + "epoch": 3.22, + "learning_rate": 1.5115416551342373e-05, + "loss": 0.104, + "step": 32940 + }, + { + "epoch": 3.22, + "learning_rate": 1.5111264876833659e-05, + "loss": 0.0984, + "step": 32945 + }, + { + "epoch": 3.22, + "learning_rate": 1.510711320232494e-05, + "loss": 0.1247, + "step": 32950 + }, + { + "epoch": 3.22, + "learning_rate": 1.510296152781622e-05, + "loss": 0.1249, + "step": 32955 + }, + { + "epoch": 3.22, + "learning_rate": 1.5098809853307501e-05, + "loss": 0.1123, + "step": 32960 + }, + { + "epoch": 3.22, + "learning_rate": 1.5094658178798782e-05, + "loss": 0.1234, + "step": 32965 + }, + { + "epoch": 3.22, + "learning_rate": 1.5090506504290064e-05, + "loss": 0.1162, + "step": 32970 + }, + { + "epoch": 3.22, + "learning_rate": 1.5086354829781345e-05, + "loss": 0.0927, + "step": 32975 + }, + { + "epoch": 3.22, + "learning_rate": 1.5082203155272626e-05, + "loss": 0.1196, + "step": 32980 + }, + { + "epoch": 3.23, + "learning_rate": 1.5078051480763907e-05, + "loss": 0.1139, + "step": 32985 + }, + { + "epoch": 3.23, + "learning_rate": 1.507389980625519e-05, + "loss": 0.1024, + "step": 32990 + }, + { + "epoch": 3.23, + "learning_rate": 1.5069748131746473e-05, + "loss": 0.0984, + "step": 32995 + }, + { + "epoch": 3.23, + "learning_rate": 1.5065596457237754e-05, + "loss": 0.1275, + "step": 33000 + }, + { + "epoch": 3.23, + "eval_cer": 0.05843744436043111, + "eval_loss": 0.24655936658382416, + "eval_runtime": 272.698, + "eval_samples_per_second": 60.03, + "eval_steps_per_second": 1.669, + "eval_wer": 0.14850825698856623, + "step": 33000 + }, + { + "epoch": 3.23, + "learning_rate": 1.5061444782729035e-05, + "loss": 0.1013, + "step": 33005 + }, + { + "epoch": 3.23, + "learning_rate": 1.5057293108220316e-05, + "loss": 0.0962, + "step": 33010 + }, + { + "epoch": 3.23, + "learning_rate": 1.5053141433711596e-05, + "loss": 0.1222, + "step": 33015 + }, + { + "epoch": 3.23, + "learning_rate": 1.5048989759202879e-05, + "loss": 0.1174, + "step": 33020 + }, + { + "epoch": 3.23, + "learning_rate": 1.504483808469416e-05, + "loss": 0.0932, + "step": 33025 + }, + { + "epoch": 3.23, + "learning_rate": 1.504068641018544e-05, + "loss": 0.1168, + "step": 33030 + }, + { + "epoch": 3.23, + "learning_rate": 1.5036534735676725e-05, + "loss": 0.1322, + "step": 33035 + }, + { + "epoch": 3.23, + "learning_rate": 1.5032383061168005e-05, + "loss": 0.1048, + "step": 33040 + }, + { + "epoch": 3.23, + "learning_rate": 1.5028231386659286e-05, + "loss": 0.1026, + "step": 33045 + }, + { + "epoch": 3.23, + "learning_rate": 1.5024079712150569e-05, + "loss": 0.1292, + "step": 33050 + }, + { + "epoch": 3.23, + "learning_rate": 1.501992803764185e-05, + "loss": 0.1002, + "step": 33055 + }, + { + "epoch": 3.23, + "learning_rate": 1.501577636313313e-05, + "loss": 0.0922, + "step": 33060 + }, + { + "epoch": 3.23, + "learning_rate": 1.501162468862441e-05, + "loss": 0.0967, + "step": 33065 + }, + { + "epoch": 3.23, + "learning_rate": 1.5007473014115692e-05, + "loss": 0.1102, + "step": 33070 + }, + { + "epoch": 3.23, + "learning_rate": 1.5003321339606977e-05, + "loss": 0.0992, + "step": 33075 + }, + { + "epoch": 3.23, + "learning_rate": 1.4999169665098257e-05, + "loss": 0.1181, + "step": 33080 + }, + { + "epoch": 3.24, + "learning_rate": 1.4995017990589537e-05, + "loss": 0.1193, + "step": 33085 + }, + { + "epoch": 3.24, + "learning_rate": 1.499086631608082e-05, + "loss": 0.1061, + "step": 33090 + }, + { + "epoch": 3.24, + "learning_rate": 1.49867146415721e-05, + "loss": 0.1042, + "step": 33095 + }, + { + "epoch": 3.24, + "learning_rate": 1.4982562967063383e-05, + "loss": 0.1092, + "step": 33100 + }, + { + "epoch": 3.24, + "learning_rate": 1.4978411292554664e-05, + "loss": 0.1096, + "step": 33105 + }, + { + "epoch": 3.24, + "learning_rate": 1.4974259618045946e-05, + "loss": 0.0998, + "step": 33110 + }, + { + "epoch": 3.24, + "learning_rate": 1.4970107943537227e-05, + "loss": 0.1317, + "step": 33115 + }, + { + "epoch": 3.24, + "learning_rate": 1.4965956269028508e-05, + "loss": 0.1148, + "step": 33120 + }, + { + "epoch": 3.24, + "learning_rate": 1.496180459451979e-05, + "loss": 0.0893, + "step": 33125 + }, + { + "epoch": 3.24, + "learning_rate": 1.4957652920011073e-05, + "loss": 0.0879, + "step": 33130 + }, + { + "epoch": 3.24, + "learning_rate": 1.4953501245502353e-05, + "loss": 0.1172, + "step": 33135 + }, + { + "epoch": 3.24, + "learning_rate": 1.4949349570993634e-05, + "loss": 0.091, + "step": 33140 + }, + { + "epoch": 3.24, + "learning_rate": 1.4945197896484915e-05, + "loss": 0.1181, + "step": 33145 + }, + { + "epoch": 3.24, + "learning_rate": 1.4941046221976197e-05, + "loss": 0.1351, + "step": 33150 + }, + { + "epoch": 3.24, + "learning_rate": 1.493689454746748e-05, + "loss": 0.1095, + "step": 33155 + }, + { + "epoch": 3.24, + "learning_rate": 1.493274287295876e-05, + "loss": 0.1021, + "step": 33160 + }, + { + "epoch": 3.24, + "learning_rate": 1.4928591198450041e-05, + "loss": 0.1164, + "step": 33165 + }, + { + "epoch": 3.24, + "learning_rate": 1.4924439523941322e-05, + "loss": 0.1081, + "step": 33170 + }, + { + "epoch": 3.24, + "learning_rate": 1.4920287849432606e-05, + "loss": 0.1084, + "step": 33175 + }, + { + "epoch": 3.24, + "learning_rate": 1.4916136174923887e-05, + "loss": 0.106, + "step": 33180 + }, + { + "epoch": 3.24, + "learning_rate": 1.4911984500415168e-05, + "loss": 0.1223, + "step": 33185 + }, + { + "epoch": 3.25, + "learning_rate": 1.4907832825906449e-05, + "loss": 0.0907, + "step": 33190 + }, + { + "epoch": 3.25, + "learning_rate": 1.490368115139773e-05, + "loss": 0.1087, + "step": 33195 + }, + { + "epoch": 3.25, + "learning_rate": 1.4899529476889014e-05, + "loss": 0.1108, + "step": 33200 + }, + { + "epoch": 3.25, + "learning_rate": 1.4895377802380294e-05, + "loss": 0.0995, + "step": 33205 + }, + { + "epoch": 3.25, + "learning_rate": 1.4891226127871575e-05, + "loss": 0.0833, + "step": 33210 + }, + { + "epoch": 3.25, + "learning_rate": 1.4887074453362856e-05, + "loss": 0.1293, + "step": 33215 + }, + { + "epoch": 3.25, + "learning_rate": 1.4882922778854138e-05, + "loss": 0.1041, + "step": 33220 + }, + { + "epoch": 3.25, + "learning_rate": 1.4878771104345419e-05, + "loss": 0.1211, + "step": 33225 + }, + { + "epoch": 3.25, + "learning_rate": 1.4874619429836702e-05, + "loss": 0.0909, + "step": 33230 + }, + { + "epoch": 3.25, + "learning_rate": 1.4870467755327982e-05, + "loss": 0.1348, + "step": 33235 + }, + { + "epoch": 3.25, + "learning_rate": 1.4866316080819265e-05, + "loss": 0.0988, + "step": 33240 + }, + { + "epoch": 3.25, + "learning_rate": 1.4862164406310546e-05, + "loss": 0.106, + "step": 33245 + }, + { + "epoch": 3.25, + "learning_rate": 1.4858012731801826e-05, + "loss": 0.1246, + "step": 33250 + }, + { + "epoch": 3.25, + "learning_rate": 1.4853861057293109e-05, + "loss": 0.0962, + "step": 33255 + }, + { + "epoch": 3.25, + "learning_rate": 1.484970938278439e-05, + "loss": 0.1193, + "step": 33260 + }, + { + "epoch": 3.25, + "learning_rate": 1.4845557708275672e-05, + "loss": 0.1189, + "step": 33265 + }, + { + "epoch": 3.25, + "learning_rate": 1.4841406033766953e-05, + "loss": 0.1082, + "step": 33270 + }, + { + "epoch": 3.25, + "learning_rate": 1.4837254359258234e-05, + "loss": 0.0994, + "step": 33275 + }, + { + "epoch": 3.25, + "learning_rate": 1.4833102684749516e-05, + "loss": 0.1065, + "step": 33280 + }, + { + "epoch": 3.25, + "learning_rate": 1.4828951010240799e-05, + "loss": 0.1118, + "step": 33285 + }, + { + "epoch": 3.26, + "learning_rate": 1.482479933573208e-05, + "loss": 0.0938, + "step": 33290 + }, + { + "epoch": 3.26, + "learning_rate": 1.482064766122336e-05, + "loss": 0.094, + "step": 33295 + }, + { + "epoch": 3.26, + "learning_rate": 1.481649598671464e-05, + "loss": 0.1281, + "step": 33300 + }, + { + "epoch": 3.26, + "learning_rate": 1.4812344312205923e-05, + "loss": 0.0975, + "step": 33305 + }, + { + "epoch": 3.26, + "learning_rate": 1.4808192637697206e-05, + "loss": 0.0917, + "step": 33310 + }, + { + "epoch": 3.26, + "learning_rate": 1.4804040963188487e-05, + "loss": 0.1226, + "step": 33315 + }, + { + "epoch": 3.26, + "learning_rate": 1.4799889288679767e-05, + "loss": 0.1091, + "step": 33320 + }, + { + "epoch": 3.26, + "learning_rate": 1.4795737614171048e-05, + "loss": 0.1055, + "step": 33325 + }, + { + "epoch": 3.26, + "learning_rate": 1.4791585939662332e-05, + "loss": 0.1219, + "step": 33330 + }, + { + "epoch": 3.26, + "learning_rate": 1.4787434265153613e-05, + "loss": 0.1342, + "step": 33335 + }, + { + "epoch": 3.26, + "learning_rate": 1.4783282590644894e-05, + "loss": 0.1145, + "step": 33340 + }, + { + "epoch": 3.26, + "learning_rate": 1.4779130916136175e-05, + "loss": 0.1054, + "step": 33345 + }, + { + "epoch": 3.26, + "learning_rate": 1.4774979241627457e-05, + "loss": 0.1341, + "step": 33350 + }, + { + "epoch": 3.26, + "learning_rate": 1.477082756711874e-05, + "loss": 0.1088, + "step": 33355 + }, + { + "epoch": 3.26, + "learning_rate": 1.476667589261002e-05, + "loss": 0.0924, + "step": 33360 + }, + { + "epoch": 3.26, + "learning_rate": 1.4762524218101301e-05, + "loss": 0.1167, + "step": 33365 + }, + { + "epoch": 3.26, + "learning_rate": 1.4758372543592582e-05, + "loss": 0.1137, + "step": 33370 + }, + { + "epoch": 3.26, + "learning_rate": 1.4754220869083864e-05, + "loss": 0.1166, + "step": 33375 + }, + { + "epoch": 3.26, + "learning_rate": 1.4750069194575147e-05, + "loss": 0.1037, + "step": 33380 + }, + { + "epoch": 3.26, + "learning_rate": 1.4745917520066427e-05, + "loss": 0.1265, + "step": 33385 + }, + { + "epoch": 3.26, + "learning_rate": 1.4741765845557708e-05, + "loss": 0.1014, + "step": 33390 + }, + { + "epoch": 3.27, + "learning_rate": 1.473761417104899e-05, + "loss": 0.1065, + "step": 33395 + }, + { + "epoch": 3.27, + "learning_rate": 1.4733462496540271e-05, + "loss": 0.1231, + "step": 33400 + }, + { + "epoch": 3.27, + "learning_rate": 1.4729310822031554e-05, + "loss": 0.0985, + "step": 33405 + }, + { + "epoch": 3.27, + "learning_rate": 1.4725159147522835e-05, + "loss": 0.1071, + "step": 33410 + }, + { + "epoch": 3.27, + "learning_rate": 1.4721007473014115e-05, + "loss": 0.1092, + "step": 33415 + }, + { + "epoch": 3.27, + "learning_rate": 1.4716855798505398e-05, + "loss": 0.1078, + "step": 33420 + }, + { + "epoch": 3.27, + "learning_rate": 1.4712704123996679e-05, + "loss": 0.092, + "step": 33425 + }, + { + "epoch": 3.27, + "learning_rate": 1.4708552449487961e-05, + "loss": 0.1059, + "step": 33430 + }, + { + "epoch": 3.27, + "learning_rate": 1.4704400774979242e-05, + "loss": 0.1226, + "step": 33435 + }, + { + "epoch": 3.27, + "learning_rate": 1.4700249100470524e-05, + "loss": 0.1107, + "step": 33440 + }, + { + "epoch": 3.27, + "learning_rate": 1.4696097425961805e-05, + "loss": 0.1093, + "step": 33445 + }, + { + "epoch": 3.27, + "learning_rate": 1.4691945751453086e-05, + "loss": 0.1225, + "step": 33450 + }, + { + "epoch": 3.27, + "learning_rate": 1.4687794076944367e-05, + "loss": 0.112, + "step": 33455 + }, + { + "epoch": 3.27, + "learning_rate": 1.4683642402435649e-05, + "loss": 0.0943, + "step": 33460 + }, + { + "epoch": 3.27, + "learning_rate": 1.4679490727926932e-05, + "loss": 0.1041, + "step": 33465 + }, + { + "epoch": 3.27, + "learning_rate": 1.4675339053418212e-05, + "loss": 0.1144, + "step": 33470 + }, + { + "epoch": 3.27, + "learning_rate": 1.4671187378909493e-05, + "loss": 0.0878, + "step": 33475 + }, + { + "epoch": 3.27, + "learning_rate": 1.4667035704400774e-05, + "loss": 0.1262, + "step": 33480 + }, + { + "epoch": 3.27, + "learning_rate": 1.4662884029892058e-05, + "loss": 0.1174, + "step": 33485 + }, + { + "epoch": 3.27, + "learning_rate": 1.4658732355383339e-05, + "loss": 0.1074, + "step": 33490 + }, + { + "epoch": 3.28, + "learning_rate": 1.465458068087462e-05, + "loss": 0.0961, + "step": 33495 + }, + { + "epoch": 3.28, + "learning_rate": 1.46504290063659e-05, + "loss": 0.1299, + "step": 33500 + }, + { + "epoch": 3.28, + "eval_cer": 0.05714024755417126, + "eval_loss": 0.23801226913928986, + "eval_runtime": 274.0675, + "eval_samples_per_second": 59.73, + "eval_steps_per_second": 1.66, + "eval_wer": 0.1463272888737977, + "step": 33500 + }, + { + "epoch": 3.28, + "learning_rate": 1.4646277331857183e-05, + "loss": 0.1066, + "step": 33505 + }, + { + "epoch": 3.28, + "learning_rate": 1.4642125657348465e-05, + "loss": 0.0906, + "step": 33510 + }, + { + "epoch": 3.28, + "learning_rate": 1.4637973982839746e-05, + "loss": 0.1232, + "step": 33515 + }, + { + "epoch": 3.28, + "learning_rate": 1.4633822308331027e-05, + "loss": 0.104, + "step": 33520 + }, + { + "epoch": 3.28, + "learning_rate": 1.4629670633822308e-05, + "loss": 0.0905, + "step": 33525 + }, + { + "epoch": 3.28, + "learning_rate": 1.462551895931359e-05, + "loss": 0.0972, + "step": 33530 + }, + { + "epoch": 3.28, + "learning_rate": 1.4621367284804873e-05, + "loss": 0.118, + "step": 33535 + }, + { + "epoch": 3.28, + "learning_rate": 1.4617215610296153e-05, + "loss": 0.0923, + "step": 33540 + }, + { + "epoch": 3.28, + "learning_rate": 1.4613063935787434e-05, + "loss": 0.0979, + "step": 33545 + }, + { + "epoch": 3.28, + "learning_rate": 1.4608912261278717e-05, + "loss": 0.1342, + "step": 33550 + }, + { + "epoch": 3.28, + "learning_rate": 1.4604760586769997e-05, + "loss": 0.1011, + "step": 33555 + }, + { + "epoch": 3.28, + "learning_rate": 1.460060891226128e-05, + "loss": 0.1071, + "step": 33560 + }, + { + "epoch": 3.28, + "learning_rate": 1.459645723775256e-05, + "loss": 0.1076, + "step": 33565 + }, + { + "epoch": 3.28, + "learning_rate": 1.4592305563243841e-05, + "loss": 0.1153, + "step": 33570 + }, + { + "epoch": 3.28, + "learning_rate": 1.4588153888735124e-05, + "loss": 0.087, + "step": 33575 + }, + { + "epoch": 3.28, + "learning_rate": 1.4584002214226405e-05, + "loss": 0.1037, + "step": 33580 + }, + { + "epoch": 3.28, + "learning_rate": 1.4579850539717687e-05, + "loss": 0.1165, + "step": 33585 + }, + { + "epoch": 3.28, + "learning_rate": 1.4575698865208968e-05, + "loss": 0.0931, + "step": 33590 + }, + { + "epoch": 3.29, + "learning_rate": 1.457154719070025e-05, + "loss": 0.1255, + "step": 33595 + }, + { + "epoch": 3.29, + "learning_rate": 1.4567395516191531e-05, + "loss": 0.1213, + "step": 33600 + }, + { + "epoch": 3.29, + "learning_rate": 1.4563243841682812e-05, + "loss": 0.0981, + "step": 33605 + }, + { + "epoch": 3.29, + "learning_rate": 1.4559092167174094e-05, + "loss": 0.0974, + "step": 33610 + }, + { + "epoch": 3.29, + "learning_rate": 1.4554940492665377e-05, + "loss": 0.1068, + "step": 33615 + }, + { + "epoch": 3.29, + "learning_rate": 1.4550788818156657e-05, + "loss": 0.1073, + "step": 33620 + }, + { + "epoch": 3.29, + "learning_rate": 1.4546637143647938e-05, + "loss": 0.097, + "step": 33625 + }, + { + "epoch": 3.29, + "learning_rate": 1.4542485469139219e-05, + "loss": 0.092, + "step": 33630 + }, + { + "epoch": 3.29, + "learning_rate": 1.4538333794630501e-05, + "loss": 0.1379, + "step": 33635 + }, + { + "epoch": 3.29, + "learning_rate": 1.4534182120121784e-05, + "loss": 0.0974, + "step": 33640 + }, + { + "epoch": 3.29, + "learning_rate": 1.4530030445613065e-05, + "loss": 0.1148, + "step": 33645 + }, + { + "epoch": 3.29, + "learning_rate": 1.4525878771104345e-05, + "loss": 0.1273, + "step": 33650 + }, + { + "epoch": 3.29, + "learning_rate": 1.4521727096595626e-05, + "loss": 0.1072, + "step": 33655 + }, + { + "epoch": 3.29, + "learning_rate": 1.4517575422086909e-05, + "loss": 0.1015, + "step": 33660 + }, + { + "epoch": 3.29, + "learning_rate": 1.4513423747578191e-05, + "loss": 0.1178, + "step": 33665 + }, + { + "epoch": 3.29, + "learning_rate": 1.4509272073069472e-05, + "loss": 0.1231, + "step": 33670 + }, + { + "epoch": 3.29, + "learning_rate": 1.4505120398560753e-05, + "loss": 0.1072, + "step": 33675 + }, + { + "epoch": 3.29, + "learning_rate": 1.4500968724052033e-05, + "loss": 0.1062, + "step": 33680 + }, + { + "epoch": 3.29, + "learning_rate": 1.4496817049543316e-05, + "loss": 0.1237, + "step": 33685 + }, + { + "epoch": 3.29, + "learning_rate": 1.4492665375034598e-05, + "loss": 0.0944, + "step": 33690 + }, + { + "epoch": 3.29, + "learning_rate": 1.4488513700525879e-05, + "loss": 0.0945, + "step": 33695 + }, + { + "epoch": 3.3, + "learning_rate": 1.448436202601716e-05, + "loss": 0.1285, + "step": 33700 + }, + { + "epoch": 3.3, + "learning_rate": 1.4480210351508442e-05, + "loss": 0.0983, + "step": 33705 + }, + { + "epoch": 3.3, + "learning_rate": 1.4476058676999723e-05, + "loss": 0.0859, + "step": 33710 + }, + { + "epoch": 3.3, + "learning_rate": 1.4471907002491006e-05, + "loss": 0.1108, + "step": 33715 + }, + { + "epoch": 3.3, + "learning_rate": 1.4467755327982286e-05, + "loss": 0.1131, + "step": 33720 + }, + { + "epoch": 3.3, + "learning_rate": 1.4463603653473569e-05, + "loss": 0.1038, + "step": 33725 + }, + { + "epoch": 3.3, + "learning_rate": 1.445945197896485e-05, + "loss": 0.1156, + "step": 33730 + }, + { + "epoch": 3.3, + "learning_rate": 1.445530030445613e-05, + "loss": 0.1206, + "step": 33735 + }, + { + "epoch": 3.3, + "learning_rate": 1.4451148629947413e-05, + "loss": 0.0993, + "step": 33740 + }, + { + "epoch": 3.3, + "learning_rate": 1.4446996955438694e-05, + "loss": 0.1067, + "step": 33745 + }, + { + "epoch": 3.3, + "learning_rate": 1.4442845280929976e-05, + "loss": 0.1319, + "step": 33750 + }, + { + "epoch": 3.3, + "learning_rate": 1.4438693606421257e-05, + "loss": 0.117, + "step": 33755 + }, + { + "epoch": 3.3, + "learning_rate": 1.4434541931912538e-05, + "loss": 0.1154, + "step": 33760 + }, + { + "epoch": 3.3, + "learning_rate": 1.443039025740382e-05, + "loss": 0.1294, + "step": 33765 + }, + { + "epoch": 3.3, + "learning_rate": 1.4427068917796845e-05, + "loss": 0.1078, + "step": 33770 + }, + { + "epoch": 3.3, + "learning_rate": 1.4422917243288127e-05, + "loss": 0.0935, + "step": 33775 + }, + { + "epoch": 3.3, + "learning_rate": 1.4418765568779408e-05, + "loss": 0.1004, + "step": 33780 + }, + { + "epoch": 3.3, + "learning_rate": 1.441461389427069e-05, + "loss": 0.1133, + "step": 33785 + }, + { + "epoch": 3.3, + "learning_rate": 1.4410462219761971e-05, + "loss": 0.1036, + "step": 33790 + }, + { + "epoch": 3.3, + "learning_rate": 1.4406310545253252e-05, + "loss": 0.0901, + "step": 33795 + }, + { + "epoch": 3.31, + "learning_rate": 1.4402158870744534e-05, + "loss": 0.1261, + "step": 33800 + }, + { + "epoch": 3.31, + "learning_rate": 1.4398007196235815e-05, + "loss": 0.1042, + "step": 33805 + }, + { + "epoch": 3.31, + "learning_rate": 1.4393855521727096e-05, + "loss": 0.0916, + "step": 33810 + }, + { + "epoch": 3.31, + "learning_rate": 1.4389703847218378e-05, + "loss": 0.1009, + "step": 33815 + }, + { + "epoch": 3.31, + "learning_rate": 1.438555217270966e-05, + "loss": 0.1072, + "step": 33820 + }, + { + "epoch": 3.31, + "learning_rate": 1.4381400498200942e-05, + "loss": 0.0942, + "step": 33825 + }, + { + "epoch": 3.31, + "learning_rate": 1.4377248823692222e-05, + "loss": 0.116, + "step": 33830 + }, + { + "epoch": 3.31, + "learning_rate": 1.4373097149183503e-05, + "loss": 0.1087, + "step": 33835 + }, + { + "epoch": 3.31, + "learning_rate": 1.4368945474674786e-05, + "loss": 0.1068, + "step": 33840 + }, + { + "epoch": 3.31, + "learning_rate": 1.4364793800166068e-05, + "loss": 0.1021, + "step": 33845 + }, + { + "epoch": 3.31, + "learning_rate": 1.4360642125657349e-05, + "loss": 0.1094, + "step": 33850 + }, + { + "epoch": 3.31, + "learning_rate": 1.435649045114863e-05, + "loss": 0.0913, + "step": 33855 + }, + { + "epoch": 3.31, + "learning_rate": 1.435233877663991e-05, + "loss": 0.0954, + "step": 33860 + }, + { + "epoch": 3.31, + "learning_rate": 1.4348187102131195e-05, + "loss": 0.1294, + "step": 33865 + }, + { + "epoch": 3.31, + "learning_rate": 1.4344035427622475e-05, + "loss": 0.1159, + "step": 33870 + }, + { + "epoch": 3.31, + "learning_rate": 1.4339883753113756e-05, + "loss": 0.1016, + "step": 33875 + }, + { + "epoch": 3.31, + "learning_rate": 1.4335732078605037e-05, + "loss": 0.1071, + "step": 33880 + }, + { + "epoch": 3.31, + "learning_rate": 1.433158040409632e-05, + "loss": 0.1135, + "step": 33885 + }, + { + "epoch": 3.31, + "learning_rate": 1.4327428729587602e-05, + "loss": 0.0947, + "step": 33890 + }, + { + "epoch": 3.31, + "learning_rate": 1.4323277055078883e-05, + "loss": 0.0998, + "step": 33895 + }, + { + "epoch": 3.31, + "learning_rate": 1.4319125380570163e-05, + "loss": 0.1076, + "step": 33900 + }, + { + "epoch": 3.32, + "learning_rate": 1.4314973706061444e-05, + "loss": 0.0983, + "step": 33905 + }, + { + "epoch": 3.32, + "learning_rate": 1.4310822031552727e-05, + "loss": 0.1097, + "step": 33910 + }, + { + "epoch": 3.32, + "learning_rate": 1.4306670357044009e-05, + "loss": 0.1144, + "step": 33915 + }, + { + "epoch": 3.32, + "learning_rate": 1.430251868253529e-05, + "loss": 0.1035, + "step": 33920 + }, + { + "epoch": 3.32, + "learning_rate": 1.429836700802657e-05, + "loss": 0.1046, + "step": 33925 + }, + { + "epoch": 3.32, + "learning_rate": 1.4294215333517853e-05, + "loss": 0.1026, + "step": 33930 + }, + { + "epoch": 3.32, + "learning_rate": 1.4290063659009134e-05, + "loss": 0.1258, + "step": 33935 + }, + { + "epoch": 3.32, + "learning_rate": 1.4285911984500416e-05, + "loss": 0.1105, + "step": 33940 + }, + { + "epoch": 3.32, + "learning_rate": 1.4281760309991697e-05, + "loss": 0.1032, + "step": 33945 + }, + { + "epoch": 3.32, + "learning_rate": 1.4277608635482978e-05, + "loss": 0.1064, + "step": 33950 + }, + { + "epoch": 3.32, + "learning_rate": 1.427345696097426e-05, + "loss": 0.0997, + "step": 33955 + }, + { + "epoch": 3.32, + "learning_rate": 1.4269305286465541e-05, + "loss": 0.0918, + "step": 33960 + }, + { + "epoch": 3.32, + "learning_rate": 1.4265153611956823e-05, + "loss": 0.1188, + "step": 33965 + }, + { + "epoch": 3.32, + "learning_rate": 1.4261001937448104e-05, + "loss": 0.1147, + "step": 33970 + }, + { + "epoch": 3.32, + "learning_rate": 1.4256850262939387e-05, + "loss": 0.0993, + "step": 33975 + }, + { + "epoch": 3.32, + "learning_rate": 1.4252698588430667e-05, + "loss": 0.1033, + "step": 33980 + }, + { + "epoch": 3.32, + "learning_rate": 1.4248546913921948e-05, + "loss": 0.1212, + "step": 33985 + }, + { + "epoch": 3.32, + "learning_rate": 1.424439523941323e-05, + "loss": 0.0982, + "step": 33990 + }, + { + "epoch": 3.32, + "learning_rate": 1.4240243564904513e-05, + "loss": 0.0929, + "step": 33995 + }, + { + "epoch": 3.32, + "learning_rate": 1.4236091890395794e-05, + "loss": 0.1129, + "step": 34000 + }, + { + "epoch": 3.32, + "eval_cer": 0.05757033419581891, + "eval_loss": 0.24162627756595612, + "eval_runtime": 271.9688, + "eval_samples_per_second": 60.191, + "eval_steps_per_second": 1.673, + "eval_wer": 0.14716310898963714, + "step": 34000 + }, + { + "epoch": 3.33, + "learning_rate": 1.4231940215887075e-05, + "loss": 0.1096, + "step": 34005 + }, + { + "epoch": 3.33, + "learning_rate": 1.4227788541378355e-05, + "loss": 0.1051, + "step": 34010 + }, + { + "epoch": 3.33, + "learning_rate": 1.4223636866869636e-05, + "loss": 0.1256, + "step": 34015 + }, + { + "epoch": 3.33, + "learning_rate": 1.421948519236092e-05, + "loss": 0.1014, + "step": 34020 + }, + { + "epoch": 3.33, + "learning_rate": 1.4215333517852201e-05, + "loss": 0.1007, + "step": 34025 + }, + { + "epoch": 3.33, + "learning_rate": 1.4211181843343482e-05, + "loss": 0.1019, + "step": 34030 + }, + { + "epoch": 3.33, + "learning_rate": 1.4207030168834763e-05, + "loss": 0.115, + "step": 34035 + }, + { + "epoch": 3.33, + "learning_rate": 1.4202878494326045e-05, + "loss": 0.0953, + "step": 34040 + }, + { + "epoch": 3.33, + "learning_rate": 1.4198726819817328e-05, + "loss": 0.102, + "step": 34045 + }, + { + "epoch": 3.33, + "learning_rate": 1.4194575145308608e-05, + "loss": 0.1281, + "step": 34050 + }, + { + "epoch": 3.33, + "learning_rate": 1.4190423470799889e-05, + "loss": 0.1, + "step": 34055 + }, + { + "epoch": 3.33, + "learning_rate": 1.418627179629117e-05, + "loss": 0.0879, + "step": 34060 + }, + { + "epoch": 3.33, + "learning_rate": 1.4182120121782452e-05, + "loss": 0.1208, + "step": 34065 + }, + { + "epoch": 3.33, + "learning_rate": 1.4177968447273735e-05, + "loss": 0.1101, + "step": 34070 + }, + { + "epoch": 3.33, + "learning_rate": 1.4173816772765016e-05, + "loss": 0.0931, + "step": 34075 + }, + { + "epoch": 3.33, + "learning_rate": 1.4169665098256296e-05, + "loss": 0.1145, + "step": 34080 + }, + { + "epoch": 3.33, + "learning_rate": 1.4165513423747579e-05, + "loss": 0.1049, + "step": 34085 + }, + { + "epoch": 3.33, + "learning_rate": 1.416136174923886e-05, + "loss": 0.0905, + "step": 34090 + }, + { + "epoch": 3.33, + "learning_rate": 1.4157210074730142e-05, + "loss": 0.0997, + "step": 34095 + }, + { + "epoch": 3.33, + "learning_rate": 1.4153058400221423e-05, + "loss": 0.1117, + "step": 34100 + }, + { + "epoch": 3.33, + "learning_rate": 1.4148906725712705e-05, + "loss": 0.1153, + "step": 34105 + }, + { + "epoch": 3.34, + "learning_rate": 1.4144755051203986e-05, + "loss": 0.0982, + "step": 34110 + }, + { + "epoch": 3.34, + "learning_rate": 1.4140603376695267e-05, + "loss": 0.1419, + "step": 34115 + }, + { + "epoch": 3.34, + "learning_rate": 1.413645170218655e-05, + "loss": 0.1261, + "step": 34120 + }, + { + "epoch": 3.34, + "learning_rate": 1.413230002767783e-05, + "loss": 0.1023, + "step": 34125 + }, + { + "epoch": 3.34, + "learning_rate": 1.4128148353169113e-05, + "loss": 0.0972, + "step": 34130 + }, + { + "epoch": 3.34, + "learning_rate": 1.4123996678660393e-05, + "loss": 0.1158, + "step": 34135 + }, + { + "epoch": 3.34, + "learning_rate": 1.4119845004151674e-05, + "loss": 0.1049, + "step": 34140 + }, + { + "epoch": 3.34, + "learning_rate": 1.4115693329642957e-05, + "loss": 0.0926, + "step": 34145 + }, + { + "epoch": 3.34, + "learning_rate": 1.4111541655134239e-05, + "loss": 0.1302, + "step": 34150 + }, + { + "epoch": 3.34, + "learning_rate": 1.410738998062552e-05, + "loss": 0.1112, + "step": 34155 + }, + { + "epoch": 3.34, + "learning_rate": 1.41032383061168e-05, + "loss": 0.0891, + "step": 34160 + }, + { + "epoch": 3.34, + "learning_rate": 1.4099086631608081e-05, + "loss": 0.1224, + "step": 34165 + }, + { + "epoch": 3.34, + "learning_rate": 1.4094934957099364e-05, + "loss": 0.1097, + "step": 34170 + }, + { + "epoch": 3.34, + "learning_rate": 1.4090783282590646e-05, + "loss": 0.0848, + "step": 34175 + }, + { + "epoch": 3.34, + "learning_rate": 1.4086631608081927e-05, + "loss": 0.1136, + "step": 34180 + }, + { + "epoch": 3.34, + "learning_rate": 1.4082479933573208e-05, + "loss": 0.1223, + "step": 34185 + }, + { + "epoch": 3.34, + "learning_rate": 1.4078328259064489e-05, + "loss": 0.0973, + "step": 34190 + }, + { + "epoch": 3.34, + "learning_rate": 1.4074176584555773e-05, + "loss": 0.0979, + "step": 34195 + }, + { + "epoch": 3.34, + "learning_rate": 1.4070024910047053e-05, + "loss": 0.1201, + "step": 34200 + }, + { + "epoch": 3.34, + "learning_rate": 1.4065873235538334e-05, + "loss": 0.1015, + "step": 34205 + }, + { + "epoch": 3.35, + "learning_rate": 1.4061721561029615e-05, + "loss": 0.1009, + "step": 34210 + }, + { + "epoch": 3.35, + "learning_rate": 1.4057569886520897e-05, + "loss": 0.1083, + "step": 34215 + }, + { + "epoch": 3.35, + "learning_rate": 1.4053418212012178e-05, + "loss": 0.1056, + "step": 34220 + }, + { + "epoch": 3.35, + "learning_rate": 1.404926653750346e-05, + "loss": 0.0969, + "step": 34225 + }, + { + "epoch": 3.35, + "learning_rate": 1.4045114862994741e-05, + "loss": 0.0992, + "step": 34230 + }, + { + "epoch": 3.35, + "learning_rate": 1.4040963188486022e-05, + "loss": 0.1087, + "step": 34235 + }, + { + "epoch": 3.35, + "learning_rate": 1.4036811513977305e-05, + "loss": 0.0981, + "step": 34240 + }, + { + "epoch": 3.35, + "learning_rate": 1.4032659839468585e-05, + "loss": 0.088, + "step": 34245 + }, + { + "epoch": 3.35, + "learning_rate": 1.4028508164959868e-05, + "loss": 0.1173, + "step": 34250 + }, + { + "epoch": 3.35, + "learning_rate": 1.4024356490451149e-05, + "loss": 0.1056, + "step": 34255 + }, + { + "epoch": 3.35, + "learning_rate": 1.4020204815942431e-05, + "loss": 0.0979, + "step": 34260 + }, + { + "epoch": 3.35, + "learning_rate": 1.4016053141433712e-05, + "loss": 0.125, + "step": 34265 + }, + { + "epoch": 3.35, + "learning_rate": 1.4011901466924993e-05, + "loss": 0.0974, + "step": 34270 + }, + { + "epoch": 3.35, + "learning_rate": 1.4007749792416275e-05, + "loss": 0.095, + "step": 34275 + }, + { + "epoch": 3.35, + "learning_rate": 1.4003598117907556e-05, + "loss": 0.1012, + "step": 34280 + }, + { + "epoch": 3.35, + "learning_rate": 1.3999446443398838e-05, + "loss": 0.107, + "step": 34285 + }, + { + "epoch": 3.35, + "learning_rate": 1.3995294768890119e-05, + "loss": 0.1018, + "step": 34290 + }, + { + "epoch": 3.35, + "learning_rate": 1.39911430943814e-05, + "loss": 0.1154, + "step": 34295 + }, + { + "epoch": 3.35, + "learning_rate": 1.3986991419872682e-05, + "loss": 0.1329, + "step": 34300 + }, + { + "epoch": 3.35, + "learning_rate": 1.3982839745363965e-05, + "loss": 0.1062, + "step": 34305 + }, + { + "epoch": 3.35, + "learning_rate": 1.3978688070855246e-05, + "loss": 0.0957, + "step": 34310 + }, + { + "epoch": 3.36, + "learning_rate": 1.3974536396346526e-05, + "loss": 0.1113, + "step": 34315 + }, + { + "epoch": 3.36, + "learning_rate": 1.3970384721837807e-05, + "loss": 0.1039, + "step": 34320 + }, + { + "epoch": 3.36, + "learning_rate": 1.3966233047329091e-05, + "loss": 0.094, + "step": 34325 + }, + { + "epoch": 3.36, + "learning_rate": 1.3962081372820372e-05, + "loss": 0.1043, + "step": 34330 + }, + { + "epoch": 3.36, + "learning_rate": 1.3957929698311653e-05, + "loss": 0.1089, + "step": 34335 + }, + { + "epoch": 3.36, + "learning_rate": 1.3953778023802934e-05, + "loss": 0.1081, + "step": 34340 + }, + { + "epoch": 3.36, + "learning_rate": 1.3949626349294214e-05, + "loss": 0.1157, + "step": 34345 + }, + { + "epoch": 3.36, + "learning_rate": 1.3945474674785499e-05, + "loss": 0.1213, + "step": 34350 + }, + { + "epoch": 3.36, + "learning_rate": 1.394132300027678e-05, + "loss": 0.0996, + "step": 34355 + }, + { + "epoch": 3.36, + "learning_rate": 1.393717132576806e-05, + "loss": 0.0935, + "step": 34360 + }, + { + "epoch": 3.36, + "learning_rate": 1.393301965125934e-05, + "loss": 0.1293, + "step": 34365 + }, + { + "epoch": 3.36, + "learning_rate": 1.3928867976750623e-05, + "loss": 0.1127, + "step": 34370 + }, + { + "epoch": 3.36, + "learning_rate": 1.3924716302241906e-05, + "loss": 0.1015, + "step": 34375 + }, + { + "epoch": 3.36, + "learning_rate": 1.3920564627733187e-05, + "loss": 0.1119, + "step": 34380 + }, + { + "epoch": 3.36, + "learning_rate": 1.3916412953224467e-05, + "loss": 0.1299, + "step": 34385 + }, + { + "epoch": 3.36, + "learning_rate": 1.3912261278715748e-05, + "loss": 0.1097, + "step": 34390 + }, + { + "epoch": 3.36, + "learning_rate": 1.390810960420703e-05, + "loss": 0.1039, + "step": 34395 + }, + { + "epoch": 3.36, + "learning_rate": 1.3903957929698313e-05, + "loss": 0.1251, + "step": 34400 + }, + { + "epoch": 3.36, + "learning_rate": 1.3899806255189594e-05, + "loss": 0.1007, + "step": 34405 + }, + { + "epoch": 3.36, + "learning_rate": 1.3895654580680875e-05, + "loss": 0.0973, + "step": 34410 + }, + { + "epoch": 3.37, + "learning_rate": 1.3891502906172157e-05, + "loss": 0.1065, + "step": 34415 + }, + { + "epoch": 3.37, + "learning_rate": 1.3887351231663438e-05, + "loss": 0.0993, + "step": 34420 + }, + { + "epoch": 3.37, + "learning_rate": 1.3883199557154719e-05, + "loss": 0.1013, + "step": 34425 + }, + { + "epoch": 3.37, + "learning_rate": 1.3879047882646001e-05, + "loss": 0.1018, + "step": 34430 + }, + { + "epoch": 3.37, + "learning_rate": 1.3874896208137283e-05, + "loss": 0.1074, + "step": 34435 + }, + { + "epoch": 3.37, + "learning_rate": 1.3870744533628564e-05, + "loss": 0.0976, + "step": 34440 + }, + { + "epoch": 3.37, + "learning_rate": 1.3866592859119845e-05, + "loss": 0.0969, + "step": 34445 + }, + { + "epoch": 3.37, + "learning_rate": 1.3862441184611126e-05, + "loss": 0.1212, + "step": 34450 + }, + { + "epoch": 3.37, + "learning_rate": 1.3858289510102408e-05, + "loss": 0.1012, + "step": 34455 + }, + { + "epoch": 3.37, + "learning_rate": 1.385413783559369e-05, + "loss": 0.0961, + "step": 34460 + }, + { + "epoch": 3.37, + "learning_rate": 1.3849986161084971e-05, + "loss": 0.1083, + "step": 34465 + }, + { + "epoch": 3.37, + "learning_rate": 1.3845834486576252e-05, + "loss": 0.1104, + "step": 34470 + }, + { + "epoch": 3.37, + "learning_rate": 1.3841682812067533e-05, + "loss": 0.1138, + "step": 34475 + }, + { + "epoch": 3.37, + "learning_rate": 1.3837531137558817e-05, + "loss": 0.1041, + "step": 34480 + }, + { + "epoch": 3.37, + "learning_rate": 1.3833379463050098e-05, + "loss": 0.1079, + "step": 34485 + }, + { + "epoch": 3.37, + "learning_rate": 1.3829227788541379e-05, + "loss": 0.1014, + "step": 34490 + }, + { + "epoch": 3.37, + "learning_rate": 1.382507611403266e-05, + "loss": 0.0961, + "step": 34495 + }, + { + "epoch": 3.37, + "learning_rate": 1.382092443952394e-05, + "loss": 0.1367, + "step": 34500 + }, + { + "epoch": 3.37, + "eval_cer": 0.058144939198235254, + "eval_loss": 0.24180500209331512, + "eval_runtime": 274.3745, + "eval_samples_per_second": 59.663, + "eval_steps_per_second": 1.658, + "eval_wer": 0.14792710081427163, + "step": 34500 + }, + { + "epoch": 3.37, + "learning_rate": 1.3816772765015224e-05, + "loss": 0.096, + "step": 34505 + }, + { + "epoch": 3.37, + "learning_rate": 1.3812621090506505e-05, + "loss": 0.0966, + "step": 34510 + }, + { + "epoch": 3.38, + "learning_rate": 1.3808469415997786e-05, + "loss": 0.1103, + "step": 34515 + }, + { + "epoch": 3.38, + "learning_rate": 1.3804317741489067e-05, + "loss": 0.1033, + "step": 34520 + }, + { + "epoch": 3.38, + "learning_rate": 1.3800166066980349e-05, + "loss": 0.0972, + "step": 34525 + }, + { + "epoch": 3.38, + "learning_rate": 1.3796014392471632e-05, + "loss": 0.1146, + "step": 34530 + }, + { + "epoch": 3.38, + "learning_rate": 1.3791862717962912e-05, + "loss": 0.1195, + "step": 34535 + }, + { + "epoch": 3.38, + "learning_rate": 1.3787711043454193e-05, + "loss": 0.0868, + "step": 34540 + }, + { + "epoch": 3.38, + "learning_rate": 1.3783559368945474e-05, + "loss": 0.0854, + "step": 34545 + }, + { + "epoch": 3.38, + "learning_rate": 1.3779407694436756e-05, + "loss": 0.1257, + "step": 34550 + }, + { + "epoch": 3.38, + "learning_rate": 1.3775256019928039e-05, + "loss": 0.0962, + "step": 34555 + }, + { + "epoch": 3.38, + "learning_rate": 1.377110434541932e-05, + "loss": 0.0974, + "step": 34560 + }, + { + "epoch": 3.38, + "learning_rate": 1.37669526709106e-05, + "loss": 0.1197, + "step": 34565 + }, + { + "epoch": 3.38, + "learning_rate": 1.3762800996401883e-05, + "loss": 0.1084, + "step": 34570 + }, + { + "epoch": 3.38, + "learning_rate": 1.3758649321893164e-05, + "loss": 0.0884, + "step": 34575 + }, + { + "epoch": 3.38, + "learning_rate": 1.3754497647384446e-05, + "loss": 0.1084, + "step": 34580 + }, + { + "epoch": 3.38, + "learning_rate": 1.3750345972875727e-05, + "loss": 0.1138, + "step": 34585 + }, + { + "epoch": 3.38, + "learning_rate": 1.374619429836701e-05, + "loss": 0.1087, + "step": 34590 + }, + { + "epoch": 3.38, + "learning_rate": 1.374204262385829e-05, + "loss": 0.1037, + "step": 34595 + }, + { + "epoch": 3.38, + "learning_rate": 1.373789094934957e-05, + "loss": 0.1162, + "step": 34600 + }, + { + "epoch": 3.38, + "learning_rate": 1.3733739274840853e-05, + "loss": 0.1174, + "step": 34605 + }, + { + "epoch": 3.38, + "learning_rate": 1.3729587600332134e-05, + "loss": 0.106, + "step": 34610 + }, + { + "epoch": 3.38, + "learning_rate": 1.3725435925823417e-05, + "loss": 0.1061, + "step": 34615 + }, + { + "epoch": 3.39, + "learning_rate": 1.3721284251314697e-05, + "loss": 0.1049, + "step": 34620 + }, + { + "epoch": 3.39, + "learning_rate": 1.3717132576805978e-05, + "loss": 0.0987, + "step": 34625 + }, + { + "epoch": 3.39, + "learning_rate": 1.3712980902297259e-05, + "loss": 0.0971, + "step": 34630 + }, + { + "epoch": 3.39, + "learning_rate": 1.3708829227788543e-05, + "loss": 0.1114, + "step": 34635 + }, + { + "epoch": 3.39, + "learning_rate": 1.3704677553279824e-05, + "loss": 0.1029, + "step": 34640 + }, + { + "epoch": 3.39, + "learning_rate": 1.3700525878771105e-05, + "loss": 0.0946, + "step": 34645 + }, + { + "epoch": 3.39, + "learning_rate": 1.3696374204262385e-05, + "loss": 0.1406, + "step": 34650 + }, + { + "epoch": 3.39, + "learning_rate": 1.3692222529753666e-05, + "loss": 0.1074, + "step": 34655 + }, + { + "epoch": 3.39, + "learning_rate": 1.368807085524495e-05, + "loss": 0.0996, + "step": 34660 + }, + { + "epoch": 3.39, + "learning_rate": 1.3683919180736231e-05, + "loss": 0.1337, + "step": 34665 + }, + { + "epoch": 3.39, + "learning_rate": 1.3679767506227512e-05, + "loss": 0.1144, + "step": 34670 + }, + { + "epoch": 3.39, + "learning_rate": 1.3675615831718792e-05, + "loss": 0.1049, + "step": 34675 + }, + { + "epoch": 3.39, + "learning_rate": 1.3671464157210075e-05, + "loss": 0.1024, + "step": 34680 + }, + { + "epoch": 3.39, + "learning_rate": 1.3667312482701357e-05, + "loss": 0.1192, + "step": 34685 + }, + { + "epoch": 3.39, + "learning_rate": 1.3663160808192638e-05, + "loss": 0.1141, + "step": 34690 + }, + { + "epoch": 3.39, + "learning_rate": 1.3659009133683919e-05, + "loss": 0.095, + "step": 34695 + }, + { + "epoch": 3.39, + "learning_rate": 1.3654857459175201e-05, + "loss": 0.1195, + "step": 34700 + }, + { + "epoch": 3.39, + "learning_rate": 1.3650705784666482e-05, + "loss": 0.1067, + "step": 34705 + }, + { + "epoch": 3.39, + "learning_rate": 1.3646554110157765e-05, + "loss": 0.0933, + "step": 34710 + }, + { + "epoch": 3.39, + "learning_rate": 1.3642402435649045e-05, + "loss": 0.1113, + "step": 34715 + }, + { + "epoch": 3.4, + "learning_rate": 1.3638250761140326e-05, + "loss": 0.1192, + "step": 34720 + }, + { + "epoch": 3.4, + "learning_rate": 1.3634099086631609e-05, + "loss": 0.1038, + "step": 34725 + }, + { + "epoch": 3.4, + "learning_rate": 1.362994741212289e-05, + "loss": 0.1117, + "step": 34730 + }, + { + "epoch": 3.4, + "learning_rate": 1.3625795737614172e-05, + "loss": 0.1288, + "step": 34735 + }, + { + "epoch": 3.4, + "learning_rate": 1.3621644063105453e-05, + "loss": 0.0885, + "step": 34740 + }, + { + "epoch": 3.4, + "learning_rate": 1.3617492388596735e-05, + "loss": 0.0959, + "step": 34745 + }, + { + "epoch": 3.4, + "learning_rate": 1.3613340714088016e-05, + "loss": 0.1214, + "step": 34750 + }, + { + "epoch": 3.4, + "learning_rate": 1.3609189039579297e-05, + "loss": 0.1022, + "step": 34755 + }, + { + "epoch": 3.4, + "learning_rate": 1.3605037365070579e-05, + "loss": 0.1058, + "step": 34760 + }, + { + "epoch": 3.4, + "learning_rate": 1.360088569056186e-05, + "loss": 0.0987, + "step": 34765 + }, + { + "epoch": 3.4, + "learning_rate": 1.3596734016053142e-05, + "loss": 0.1106, + "step": 34770 + }, + { + "epoch": 3.4, + "learning_rate": 1.3592582341544423e-05, + "loss": 0.0829, + "step": 34775 + }, + { + "epoch": 3.4, + "learning_rate": 1.3588430667035704e-05, + "loss": 0.0993, + "step": 34780 + }, + { + "epoch": 3.4, + "learning_rate": 1.3584278992526986e-05, + "loss": 0.1162, + "step": 34785 + }, + { + "epoch": 3.4, + "learning_rate": 1.3580127318018269e-05, + "loss": 0.0923, + "step": 34790 + }, + { + "epoch": 3.4, + "learning_rate": 1.357597564350955e-05, + "loss": 0.0923, + "step": 34795 + }, + { + "epoch": 3.4, + "learning_rate": 1.357182396900083e-05, + "loss": 0.1166, + "step": 34800 + }, + { + "epoch": 3.4, + "learning_rate": 1.3567672294492111e-05, + "loss": 0.1097, + "step": 34805 + }, + { + "epoch": 3.4, + "learning_rate": 1.3563520619983395e-05, + "loss": 0.1041, + "step": 34810 + }, + { + "epoch": 3.4, + "learning_rate": 1.3559368945474676e-05, + "loss": 0.1246, + "step": 34815 + }, + { + "epoch": 3.4, + "learning_rate": 1.3555217270965957e-05, + "loss": 0.119, + "step": 34820 + }, + { + "epoch": 3.41, + "learning_rate": 1.3551065596457238e-05, + "loss": 0.0988, + "step": 34825 + }, + { + "epoch": 3.41, + "learning_rate": 1.3546913921948518e-05, + "loss": 0.1196, + "step": 34830 + }, + { + "epoch": 3.41, + "learning_rate": 1.35427622474398e-05, + "loss": 0.1181, + "step": 34835 + }, + { + "epoch": 3.41, + "learning_rate": 1.3538610572931083e-05, + "loss": 0.0946, + "step": 34840 + }, + { + "epoch": 3.41, + "learning_rate": 1.3534458898422364e-05, + "loss": 0.0986, + "step": 34845 + }, + { + "epoch": 3.41, + "learning_rate": 1.3530307223913645e-05, + "loss": 0.1498, + "step": 34850 + }, + { + "epoch": 3.41, + "learning_rate": 1.3526155549404927e-05, + "loss": 0.0994, + "step": 34855 + }, + { + "epoch": 3.41, + "learning_rate": 1.3522003874896208e-05, + "loss": 0.1259, + "step": 34860 + }, + { + "epoch": 3.41, + "learning_rate": 1.351785220038749e-05, + "loss": 0.1304, + "step": 34865 + }, + { + "epoch": 3.41, + "learning_rate": 1.3513700525878771e-05, + "loss": 0.1091, + "step": 34870 + }, + { + "epoch": 3.41, + "learning_rate": 1.3509548851370052e-05, + "loss": 0.0984, + "step": 34875 + }, + { + "epoch": 3.41, + "learning_rate": 1.3505397176861334e-05, + "loss": 0.1012, + "step": 34880 + }, + { + "epoch": 3.41, + "learning_rate": 1.3501245502352615e-05, + "loss": 0.1311, + "step": 34885 + }, + { + "epoch": 3.41, + "learning_rate": 1.3497093827843898e-05, + "loss": 0.0881, + "step": 34890 + }, + { + "epoch": 3.41, + "learning_rate": 1.3492942153335178e-05, + "loss": 0.0969, + "step": 34895 + }, + { + "epoch": 3.41, + "learning_rate": 1.3488790478826461e-05, + "loss": 0.1158, + "step": 34900 + }, + { + "epoch": 3.41, + "learning_rate": 1.3484638804317742e-05, + "loss": 0.0909, + "step": 34905 + }, + { + "epoch": 3.41, + "learning_rate": 1.3480487129809022e-05, + "loss": 0.0928, + "step": 34910 + }, + { + "epoch": 3.41, + "learning_rate": 1.3476335455300305e-05, + "loss": 0.1196, + "step": 34915 + }, + { + "epoch": 3.41, + "learning_rate": 1.3472183780791587e-05, + "loss": 0.1086, + "step": 34920 + }, + { + "epoch": 3.42, + "learning_rate": 1.3468032106282868e-05, + "loss": 0.1109, + "step": 34925 + }, + { + "epoch": 3.42, + "learning_rate": 1.3463880431774149e-05, + "loss": 0.1169, + "step": 34930 + }, + { + "epoch": 3.42, + "learning_rate": 1.345972875726543e-05, + "loss": 0.1204, + "step": 34935 + }, + { + "epoch": 3.42, + "learning_rate": 1.3455577082756712e-05, + "loss": 0.093, + "step": 34940 + }, + { + "epoch": 3.42, + "learning_rate": 1.3451425408247995e-05, + "loss": 0.1089, + "step": 34945 + }, + { + "epoch": 3.42, + "learning_rate": 1.3447273733739275e-05, + "loss": 0.1052, + "step": 34950 + }, + { + "epoch": 3.42, + "learning_rate": 1.3443122059230556e-05, + "loss": 0.1006, + "step": 34955 + }, + { + "epoch": 3.42, + "learning_rate": 1.3438970384721837e-05, + "loss": 0.0964, + "step": 34960 + }, + { + "epoch": 3.42, + "learning_rate": 1.3434818710213121e-05, + "loss": 0.1034, + "step": 34965 + }, + { + "epoch": 3.42, + "learning_rate": 1.3430667035704402e-05, + "loss": 0.1114, + "step": 34970 + }, + { + "epoch": 3.42, + "learning_rate": 1.3426515361195683e-05, + "loss": 0.1038, + "step": 34975 + }, + { + "epoch": 3.42, + "learning_rate": 1.3422363686686963e-05, + "loss": 0.1031, + "step": 34980 + }, + { + "epoch": 3.42, + "learning_rate": 1.3418212012178244e-05, + "loss": 0.1286, + "step": 34985 + }, + { + "epoch": 3.42, + "learning_rate": 1.3414060337669528e-05, + "loss": 0.1101, + "step": 34990 + }, + { + "epoch": 3.42, + "learning_rate": 1.3409908663160809e-05, + "loss": 0.0823, + "step": 34995 + }, + { + "epoch": 3.42, + "learning_rate": 1.340575698865209e-05, + "loss": 0.1166, + "step": 35000 + }, + { + "epoch": 3.42, + "eval_cer": 0.05725123765524162, + "eval_loss": 0.24179156124591827, + "eval_runtime": 273.4062, + "eval_samples_per_second": 59.874, + "eval_steps_per_second": 1.664, + "eval_wer": 0.14575266254415808, + "step": 35000 + }, + { + "epoch": 3.42, + "learning_rate": 1.340160531414337e-05, + "loss": 0.0932, + "step": 35005 + }, + { + "epoch": 3.42, + "learning_rate": 1.3397453639634653e-05, + "loss": 0.0889, + "step": 35010 + }, + { + "epoch": 3.42, + "learning_rate": 1.3393301965125936e-05, + "loss": 0.1184, + "step": 35015 + }, + { + "epoch": 3.42, + "learning_rate": 1.3389150290617216e-05, + "loss": 0.1057, + "step": 35020 + }, + { + "epoch": 3.42, + "learning_rate": 1.3384998616108497e-05, + "loss": 0.1036, + "step": 35025 + }, + { + "epoch": 3.43, + "learning_rate": 1.338084694159978e-05, + "loss": 0.0966, + "step": 35030 + }, + { + "epoch": 3.43, + "learning_rate": 1.337669526709106e-05, + "loss": 0.1244, + "step": 35035 + }, + { + "epoch": 3.43, + "learning_rate": 1.3372543592582341e-05, + "loss": 0.0997, + "step": 35040 + }, + { + "epoch": 3.43, + "learning_rate": 1.3368391918073624e-05, + "loss": 0.1132, + "step": 35045 + }, + { + "epoch": 3.43, + "learning_rate": 1.3364240243564904e-05, + "loss": 0.1118, + "step": 35050 + }, + { + "epoch": 3.43, + "learning_rate": 1.3360088569056187e-05, + "loss": 0.1068, + "step": 35055 + }, + { + "epoch": 3.43, + "learning_rate": 1.3355936894547468e-05, + "loss": 0.0863, + "step": 35060 + }, + { + "epoch": 3.43, + "learning_rate": 1.3351785220038748e-05, + "loss": 0.1175, + "step": 35065 + }, + { + "epoch": 3.43, + "learning_rate": 1.334763354553003e-05, + "loss": 0.092, + "step": 35070 + }, + { + "epoch": 3.43, + "learning_rate": 1.3343481871021313e-05, + "loss": 0.0913, + "step": 35075 + }, + { + "epoch": 3.43, + "learning_rate": 1.3339330196512594e-05, + "loss": 0.1146, + "step": 35080 + }, + { + "epoch": 3.43, + "learning_rate": 1.3335178522003875e-05, + "loss": 0.1205, + "step": 35085 + }, + { + "epoch": 3.43, + "learning_rate": 1.3331026847495156e-05, + "loss": 0.1015, + "step": 35090 + }, + { + "epoch": 3.43, + "learning_rate": 1.3326875172986438e-05, + "loss": 0.1033, + "step": 35095 + }, + { + "epoch": 3.43, + "learning_rate": 1.332272349847772e-05, + "loss": 0.1336, + "step": 35100 + }, + { + "epoch": 3.43, + "learning_rate": 1.3318571823969001e-05, + "loss": 0.1018, + "step": 35105 + }, + { + "epoch": 3.43, + "learning_rate": 1.3314420149460282e-05, + "loss": 0.0925, + "step": 35110 + }, + { + "epoch": 3.43, + "learning_rate": 1.3310268474951563e-05, + "loss": 0.1143, + "step": 35115 + }, + { + "epoch": 3.43, + "learning_rate": 1.3306116800442847e-05, + "loss": 0.1176, + "step": 35120 + }, + { + "epoch": 3.43, + "learning_rate": 1.3301965125934128e-05, + "loss": 0.1117, + "step": 35125 + }, + { + "epoch": 3.44, + "learning_rate": 1.3297813451425408e-05, + "loss": 0.1136, + "step": 35130 + }, + { + "epoch": 3.44, + "learning_rate": 1.329366177691669e-05, + "loss": 0.1211, + "step": 35135 + }, + { + "epoch": 3.44, + "learning_rate": 1.3289510102407972e-05, + "loss": 0.0961, + "step": 35140 + }, + { + "epoch": 3.44, + "learning_rate": 1.3285358427899254e-05, + "loss": 0.1008, + "step": 35145 + }, + { + "epoch": 3.44, + "learning_rate": 1.3281206753390535e-05, + "loss": 0.1147, + "step": 35150 + }, + { + "epoch": 3.44, + "learning_rate": 1.3277055078881816e-05, + "loss": 0.0928, + "step": 35155 + }, + { + "epoch": 3.44, + "learning_rate": 1.3272903404373096e-05, + "loss": 0.1116, + "step": 35160 + }, + { + "epoch": 3.44, + "learning_rate": 1.3268751729864379e-05, + "loss": 0.1189, + "step": 35165 + }, + { + "epoch": 3.44, + "learning_rate": 1.3264600055355661e-05, + "loss": 0.1083, + "step": 35170 + }, + { + "epoch": 3.44, + "learning_rate": 1.3260448380846942e-05, + "loss": 0.1153, + "step": 35175 + }, + { + "epoch": 3.44, + "learning_rate": 1.3256296706338223e-05, + "loss": 0.1011, + "step": 35180 + }, + { + "epoch": 3.44, + "learning_rate": 1.3252145031829505e-05, + "loss": 0.1125, + "step": 35185 + }, + { + "epoch": 3.44, + "learning_rate": 1.3247993357320786e-05, + "loss": 0.1031, + "step": 35190 + }, + { + "epoch": 3.44, + "learning_rate": 1.3243841682812069e-05, + "loss": 0.0873, + "step": 35195 + }, + { + "epoch": 3.44, + "learning_rate": 1.323969000830335e-05, + "loss": 0.1229, + "step": 35200 + }, + { + "epoch": 3.44, + "learning_rate": 1.323553833379463e-05, + "loss": 0.1101, + "step": 35205 + }, + { + "epoch": 3.44, + "learning_rate": 1.3231386659285913e-05, + "loss": 0.1026, + "step": 35210 + }, + { + "epoch": 3.44, + "learning_rate": 1.3227234984777193e-05, + "loss": 0.123, + "step": 35215 + }, + { + "epoch": 3.44, + "learning_rate": 1.3223083310268476e-05, + "loss": 0.0978, + "step": 35220 + }, + { + "epoch": 3.44, + "learning_rate": 1.3218931635759757e-05, + "loss": 0.0884, + "step": 35225 + }, + { + "epoch": 3.44, + "learning_rate": 1.3214779961251039e-05, + "loss": 0.0914, + "step": 35230 + }, + { + "epoch": 3.45, + "learning_rate": 1.321062828674232e-05, + "loss": 0.1024, + "step": 35235 + }, + { + "epoch": 3.45, + "learning_rate": 1.32064766122336e-05, + "loss": 0.0987, + "step": 35240 + }, + { + "epoch": 3.45, + "learning_rate": 1.3202324937724881e-05, + "loss": 0.0949, + "step": 35245 + }, + { + "epoch": 3.45, + "learning_rate": 1.3198173263216164e-05, + "loss": 0.124, + "step": 35250 + }, + { + "epoch": 3.45, + "learning_rate": 1.3194021588707446e-05, + "loss": 0.0968, + "step": 35255 + }, + { + "epoch": 3.45, + "learning_rate": 1.3189869914198727e-05, + "loss": 0.0928, + "step": 35260 + }, + { + "epoch": 3.45, + "learning_rate": 1.3185718239690008e-05, + "loss": 0.126, + "step": 35265 + }, + { + "epoch": 3.45, + "learning_rate": 1.3181566565181289e-05, + "loss": 0.1088, + "step": 35270 + }, + { + "epoch": 3.45, + "learning_rate": 1.3177414890672573e-05, + "loss": 0.0974, + "step": 35275 + }, + { + "epoch": 3.45, + "learning_rate": 1.3173263216163854e-05, + "loss": 0.1172, + "step": 35280 + }, + { + "epoch": 3.45, + "learning_rate": 1.3169111541655134e-05, + "loss": 0.1211, + "step": 35285 + }, + { + "epoch": 3.45, + "learning_rate": 1.3164959867146415e-05, + "loss": 0.1005, + "step": 35290 + }, + { + "epoch": 3.45, + "learning_rate": 1.3160808192637698e-05, + "loss": 0.1075, + "step": 35295 + }, + { + "epoch": 3.45, + "learning_rate": 1.315665651812898e-05, + "loss": 0.126, + "step": 35300 + }, + { + "epoch": 3.45, + "learning_rate": 1.315250484362026e-05, + "loss": 0.1048, + "step": 35305 + }, + { + "epoch": 3.45, + "learning_rate": 1.3148353169111542e-05, + "loss": 0.0994, + "step": 35310 + }, + { + "epoch": 3.45, + "learning_rate": 1.3144201494602822e-05, + "loss": 0.0998, + "step": 35315 + }, + { + "epoch": 3.45, + "learning_rate": 1.3140049820094105e-05, + "loss": 0.1169, + "step": 35320 + }, + { + "epoch": 3.45, + "learning_rate": 1.3135898145585387e-05, + "loss": 0.0986, + "step": 35325 + }, + { + "epoch": 3.45, + "learning_rate": 1.3131746471076668e-05, + "loss": 0.1009, + "step": 35330 + }, + { + "epoch": 3.46, + "learning_rate": 1.3127594796567949e-05, + "loss": 0.1302, + "step": 35335 + }, + { + "epoch": 3.46, + "learning_rate": 1.3123443122059231e-05, + "loss": 0.0973, + "step": 35340 + }, + { + "epoch": 3.46, + "learning_rate": 1.3119291447550512e-05, + "loss": 0.1138, + "step": 35345 + }, + { + "epoch": 3.46, + "learning_rate": 1.3115139773041794e-05, + "loss": 0.1394, + "step": 35350 + }, + { + "epoch": 3.46, + "learning_rate": 1.3110988098533075e-05, + "loss": 0.0862, + "step": 35355 + }, + { + "epoch": 3.46, + "learning_rate": 1.3106836424024356e-05, + "loss": 0.1033, + "step": 35360 + }, + { + "epoch": 3.46, + "learning_rate": 1.3102684749515638e-05, + "loss": 0.1035, + "step": 35365 + }, + { + "epoch": 3.46, + "learning_rate": 1.309853307500692e-05, + "loss": 0.0999, + "step": 35370 + }, + { + "epoch": 3.46, + "learning_rate": 1.3094381400498202e-05, + "loss": 0.0867, + "step": 35375 + }, + { + "epoch": 3.46, + "learning_rate": 1.3090229725989482e-05, + "loss": 0.1066, + "step": 35380 + }, + { + "epoch": 3.46, + "learning_rate": 1.3086078051480765e-05, + "loss": 0.1251, + "step": 35385 + }, + { + "epoch": 3.46, + "learning_rate": 1.3081926376972046e-05, + "loss": 0.0931, + "step": 35390 + }, + { + "epoch": 3.46, + "learning_rate": 1.3077774702463326e-05, + "loss": 0.0808, + "step": 35395 + }, + { + "epoch": 3.46, + "learning_rate": 1.3073623027954609e-05, + "loss": 0.128, + "step": 35400 + }, + { + "epoch": 3.46, + "learning_rate": 1.3069471353445891e-05, + "loss": 0.1055, + "step": 35405 + }, + { + "epoch": 3.46, + "learning_rate": 1.3065319678937172e-05, + "loss": 0.0982, + "step": 35410 + }, + { + "epoch": 3.46, + "learning_rate": 1.3061168004428453e-05, + "loss": 0.1275, + "step": 35415 + }, + { + "epoch": 3.46, + "learning_rate": 1.3057016329919734e-05, + "loss": 0.0978, + "step": 35420 + }, + { + "epoch": 3.46, + "learning_rate": 1.3052864655411016e-05, + "loss": 0.0839, + "step": 35425 + }, + { + "epoch": 3.46, + "learning_rate": 1.3048712980902299e-05, + "loss": 0.1133, + "step": 35430 + }, + { + "epoch": 3.46, + "learning_rate": 1.304456130639358e-05, + "loss": 0.1265, + "step": 35435 + }, + { + "epoch": 3.47, + "learning_rate": 1.304040963188486e-05, + "loss": 0.1023, + "step": 35440 + }, + { + "epoch": 3.47, + "learning_rate": 1.3036257957376141e-05, + "loss": 0.1135, + "step": 35445 + }, + { + "epoch": 3.47, + "learning_rate": 1.3032106282867423e-05, + "loss": 0.1199, + "step": 35450 + }, + { + "epoch": 3.47, + "learning_rate": 1.3027954608358706e-05, + "loss": 0.1, + "step": 35455 + }, + { + "epoch": 3.47, + "learning_rate": 1.3023802933849987e-05, + "loss": 0.1058, + "step": 35460 + }, + { + "epoch": 3.47, + "learning_rate": 1.3019651259341267e-05, + "loss": 0.1487, + "step": 35465 + }, + { + "epoch": 3.47, + "learning_rate": 1.3015499584832548e-05, + "loss": 0.1055, + "step": 35470 + }, + { + "epoch": 3.47, + "learning_rate": 1.301134791032383e-05, + "loss": 0.0917, + "step": 35475 + }, + { + "epoch": 3.47, + "learning_rate": 1.3007196235815113e-05, + "loss": 0.0948, + "step": 35480 + }, + { + "epoch": 3.47, + "learning_rate": 1.3003044561306394e-05, + "loss": 0.1243, + "step": 35485 + }, + { + "epoch": 3.47, + "learning_rate": 1.2998892886797675e-05, + "loss": 0.0931, + "step": 35490 + }, + { + "epoch": 3.47, + "learning_rate": 1.2994741212288957e-05, + "loss": 0.1053, + "step": 35495 + }, + { + "epoch": 3.47, + "learning_rate": 1.2990589537780238e-05, + "loss": 0.1264, + "step": 35500 + }, + { + "epoch": 3.47, + "eval_cer": 0.05687202147658456, + "eval_loss": 0.23485976457595825, + "eval_runtime": 275.777, + "eval_samples_per_second": 59.36, + "eval_steps_per_second": 1.65, + "eval_wer": 0.14489072304969866, + "step": 35500 + }, + { + "epoch": 3.47, + "learning_rate": 1.298643786327152e-05, + "loss": 0.1102, + "step": 35505 + }, + { + "epoch": 3.47, + "learning_rate": 1.2982286188762801e-05, + "loss": 0.0943, + "step": 35510 + }, + { + "epoch": 3.47, + "learning_rate": 1.2978134514254084e-05, + "loss": 0.1019, + "step": 35515 + }, + { + "epoch": 3.47, + "learning_rate": 1.2973982839745364e-05, + "loss": 0.1027, + "step": 35520 + }, + { + "epoch": 3.47, + "learning_rate": 1.2969831165236645e-05, + "loss": 0.1001, + "step": 35525 + }, + { + "epoch": 3.47, + "learning_rate": 1.2965679490727928e-05, + "loss": 0.1143, + "step": 35530 + }, + { + "epoch": 3.47, + "learning_rate": 1.2961527816219208e-05, + "loss": 0.1255, + "step": 35535 + }, + { + "epoch": 3.48, + "learning_rate": 1.295737614171049e-05, + "loss": 0.0889, + "step": 35540 + }, + { + "epoch": 3.48, + "learning_rate": 1.2953224467201772e-05, + "loss": 0.1011, + "step": 35545 + }, + { + "epoch": 3.48, + "learning_rate": 1.2949072792693052e-05, + "loss": 0.1059, + "step": 35550 + }, + { + "epoch": 3.48, + "learning_rate": 1.2944921118184335e-05, + "loss": 0.0989, + "step": 35555 + }, + { + "epoch": 3.48, + "learning_rate": 1.2940769443675617e-05, + "loss": 0.0918, + "step": 35560 + }, + { + "epoch": 3.48, + "learning_rate": 1.2936617769166898e-05, + "loss": 0.1328, + "step": 35565 + }, + { + "epoch": 3.48, + "learning_rate": 1.2932466094658179e-05, + "loss": 0.1062, + "step": 35570 + }, + { + "epoch": 3.48, + "learning_rate": 1.292831442014946e-05, + "loss": 0.0997, + "step": 35575 + }, + { + "epoch": 3.48, + "learning_rate": 1.2924162745640742e-05, + "loss": 0.1049, + "step": 35580 + }, + { + "epoch": 3.48, + "learning_rate": 1.2920011071132024e-05, + "loss": 0.0999, + "step": 35585 + }, + { + "epoch": 3.48, + "learning_rate": 1.2915859396623305e-05, + "loss": 0.0943, + "step": 35590 + }, + { + "epoch": 3.48, + "learning_rate": 1.2911707722114586e-05, + "loss": 0.0939, + "step": 35595 + }, + { + "epoch": 3.48, + "learning_rate": 1.2907556047605867e-05, + "loss": 0.1247, + "step": 35600 + }, + { + "epoch": 3.48, + "learning_rate": 1.2903404373097151e-05, + "loss": 0.1002, + "step": 35605 + }, + { + "epoch": 3.48, + "learning_rate": 1.2899252698588432e-05, + "loss": 0.1007, + "step": 35610 + }, + { + "epoch": 3.48, + "learning_rate": 1.2895101024079712e-05, + "loss": 0.1281, + "step": 35615 + }, + { + "epoch": 3.48, + "learning_rate": 1.2890949349570993e-05, + "loss": 0.1017, + "step": 35620 + }, + { + "epoch": 3.48, + "learning_rate": 1.2886797675062276e-05, + "loss": 0.085, + "step": 35625 + }, + { + "epoch": 3.48, + "learning_rate": 1.2882646000553558e-05, + "loss": 0.1008, + "step": 35630 + }, + { + "epoch": 3.48, + "learning_rate": 1.2878494326044839e-05, + "loss": 0.1099, + "step": 35635 + }, + { + "epoch": 3.49, + "learning_rate": 1.287434265153612e-05, + "loss": 0.1076, + "step": 35640 + }, + { + "epoch": 3.49, + "learning_rate": 1.28701909770274e-05, + "loss": 0.1005, + "step": 35645 + }, + { + "epoch": 3.49, + "learning_rate": 1.2866039302518683e-05, + "loss": 0.1229, + "step": 35650 + }, + { + "epoch": 3.49, + "learning_rate": 1.2861887628009964e-05, + "loss": 0.0939, + "step": 35655 + }, + { + "epoch": 3.49, + "learning_rate": 1.2857735953501246e-05, + "loss": 0.097, + "step": 35660 + }, + { + "epoch": 3.49, + "learning_rate": 1.2853584278992527e-05, + "loss": 0.1165, + "step": 35665 + }, + { + "epoch": 3.49, + "learning_rate": 1.284943260448381e-05, + "loss": 0.1118, + "step": 35670 + }, + { + "epoch": 3.49, + "learning_rate": 1.284528092997509e-05, + "loss": 0.0986, + "step": 35675 + }, + { + "epoch": 3.49, + "learning_rate": 1.2841129255466371e-05, + "loss": 0.0946, + "step": 35680 + }, + { + "epoch": 3.49, + "learning_rate": 1.2836977580957653e-05, + "loss": 0.1262, + "step": 35685 + }, + { + "epoch": 3.49, + "learning_rate": 1.2832825906448934e-05, + "loss": 0.094, + "step": 35690 + }, + { + "epoch": 3.49, + "learning_rate": 1.2828674231940217e-05, + "loss": 0.098, + "step": 35695 + }, + { + "epoch": 3.49, + "learning_rate": 1.2824522557431497e-05, + "loss": 0.1113, + "step": 35700 + }, + { + "epoch": 3.49, + "learning_rate": 1.2820370882922778e-05, + "loss": 0.1018, + "step": 35705 + }, + { + "epoch": 3.49, + "learning_rate": 1.281621920841406e-05, + "loss": 0.0992, + "step": 35710 + }, + { + "epoch": 3.49, + "learning_rate": 1.2812067533905343e-05, + "loss": 0.1074, + "step": 35715 + }, + { + "epoch": 3.49, + "learning_rate": 1.2807915859396624e-05, + "loss": 0.1036, + "step": 35720 + }, + { + "epoch": 3.49, + "learning_rate": 1.2803764184887905e-05, + "loss": 0.0835, + "step": 35725 + }, + { + "epoch": 3.49, + "learning_rate": 1.2799612510379185e-05, + "loss": 0.1006, + "step": 35730 + }, + { + "epoch": 3.49, + "learning_rate": 1.279546083587047e-05, + "loss": 0.1139, + "step": 35735 + }, + { + "epoch": 3.49, + "learning_rate": 1.279130916136175e-05, + "loss": 0.1214, + "step": 35740 + }, + { + "epoch": 3.5, + "learning_rate": 1.2787157486853031e-05, + "loss": 0.1035, + "step": 35745 + }, + { + "epoch": 3.5, + "learning_rate": 1.2783005812344312e-05, + "loss": 0.1198, + "step": 35750 + }, + { + "epoch": 3.5, + "learning_rate": 1.2778854137835593e-05, + "loss": 0.0998, + "step": 35755 + }, + { + "epoch": 3.5, + "learning_rate": 1.2774702463326877e-05, + "loss": 0.0802, + "step": 35760 + }, + { + "epoch": 3.5, + "learning_rate": 1.2770550788818158e-05, + "loss": 0.1131, + "step": 35765 + }, + { + "epoch": 3.5, + "learning_rate": 1.2766399114309438e-05, + "loss": 0.1213, + "step": 35770 + }, + { + "epoch": 3.5, + "learning_rate": 1.2762247439800719e-05, + "loss": 0.0969, + "step": 35775 + }, + { + "epoch": 3.5, + "learning_rate": 1.2758095765292002e-05, + "loss": 0.113, + "step": 35780 + }, + { + "epoch": 3.5, + "learning_rate": 1.2753944090783284e-05, + "loss": 0.1168, + "step": 35785 + }, + { + "epoch": 3.5, + "learning_rate": 1.2749792416274565e-05, + "loss": 0.1038, + "step": 35790 + }, + { + "epoch": 3.5, + "learning_rate": 1.2745640741765846e-05, + "loss": 0.0889, + "step": 35795 + }, + { + "epoch": 3.5, + "learning_rate": 1.2741489067257126e-05, + "loss": 0.1089, + "step": 35800 + }, + { + "epoch": 3.5, + "learning_rate": 1.2737337392748409e-05, + "loss": 0.1056, + "step": 35805 + }, + { + "epoch": 3.5, + "learning_rate": 1.2733185718239691e-05, + "loss": 0.0857, + "step": 35810 + }, + { + "epoch": 3.5, + "learning_rate": 1.2729034043730972e-05, + "loss": 0.1128, + "step": 35815 + }, + { + "epoch": 3.5, + "learning_rate": 1.2724882369222253e-05, + "loss": 0.1066, + "step": 35820 + }, + { + "epoch": 3.5, + "learning_rate": 1.2720730694713535e-05, + "loss": 0.0878, + "step": 35825 + }, + { + "epoch": 3.5, + "learning_rate": 1.2716579020204816e-05, + "loss": 0.1055, + "step": 35830 + }, + { + "epoch": 3.5, + "learning_rate": 1.2712427345696098e-05, + "loss": 0.1229, + "step": 35835 + }, + { + "epoch": 3.5, + "learning_rate": 1.270827567118738e-05, + "loss": 0.0981, + "step": 35840 + }, + { + "epoch": 3.51, + "learning_rate": 1.2704123996678662e-05, + "loss": 0.1006, + "step": 35845 + }, + { + "epoch": 3.51, + "learning_rate": 1.2699972322169942e-05, + "loss": 0.1286, + "step": 35850 + }, + { + "epoch": 3.51, + "learning_rate": 1.2695820647661223e-05, + "loss": 0.1004, + "step": 35855 + }, + { + "epoch": 3.51, + "learning_rate": 1.2691668973152504e-05, + "loss": 0.1131, + "step": 35860 + }, + { + "epoch": 3.51, + "learning_rate": 1.2687517298643786e-05, + "loss": 0.1082, + "step": 35865 + }, + { + "epoch": 3.51, + "learning_rate": 1.2683365624135069e-05, + "loss": 0.1158, + "step": 35870 + }, + { + "epoch": 3.51, + "learning_rate": 1.267921394962635e-05, + "loss": 0.1029, + "step": 35875 + }, + { + "epoch": 3.51, + "learning_rate": 1.267506227511763e-05, + "loss": 0.1325, + "step": 35880 + }, + { + "epoch": 3.51, + "learning_rate": 1.2670910600608911e-05, + "loss": 0.1127, + "step": 35885 + }, + { + "epoch": 3.51, + "learning_rate": 1.2666758926100195e-05, + "loss": 0.0992, + "step": 35890 + }, + { + "epoch": 3.51, + "learning_rate": 1.2662607251591476e-05, + "loss": 0.1076, + "step": 35895 + }, + { + "epoch": 3.51, + "learning_rate": 1.2658455577082757e-05, + "loss": 0.1268, + "step": 35900 + }, + { + "epoch": 3.51, + "learning_rate": 1.2654303902574038e-05, + "loss": 0.1005, + "step": 35905 + }, + { + "epoch": 3.51, + "learning_rate": 1.2650152228065318e-05, + "loss": 0.1105, + "step": 35910 + }, + { + "epoch": 3.51, + "learning_rate": 1.2646000553556603e-05, + "loss": 0.123, + "step": 35915 + }, + { + "epoch": 3.51, + "learning_rate": 1.2641848879047883e-05, + "loss": 0.1063, + "step": 35920 + }, + { + "epoch": 3.51, + "learning_rate": 1.2637697204539164e-05, + "loss": 0.1047, + "step": 35925 + }, + { + "epoch": 3.51, + "learning_rate": 1.2633545530030445e-05, + "loss": 0.1075, + "step": 35930 + }, + { + "epoch": 3.51, + "learning_rate": 1.2629393855521727e-05, + "loss": 0.1174, + "step": 35935 + }, + { + "epoch": 3.51, + "learning_rate": 1.262524218101301e-05, + "loss": 0.0907, + "step": 35940 + }, + { + "epoch": 3.51, + "learning_rate": 1.262109050650429e-05, + "loss": 0.0885, + "step": 35945 + }, + { + "epoch": 3.52, + "learning_rate": 1.2616938831995571e-05, + "loss": 0.1088, + "step": 35950 + }, + { + "epoch": 3.52, + "learning_rate": 1.2612787157486854e-05, + "loss": 0.0863, + "step": 35955 + }, + { + "epoch": 3.52, + "learning_rate": 1.2608635482978135e-05, + "loss": 0.0778, + "step": 35960 + }, + { + "epoch": 3.52, + "learning_rate": 1.2604483808469417e-05, + "loss": 0.1166, + "step": 35965 + }, + { + "epoch": 3.52, + "learning_rate": 1.2600332133960698e-05, + "loss": 0.0973, + "step": 35970 + }, + { + "epoch": 3.52, + "learning_rate": 1.2596180459451979e-05, + "loss": 0.0922, + "step": 35975 + }, + { + "epoch": 3.52, + "learning_rate": 1.2592028784943261e-05, + "loss": 0.0991, + "step": 35980 + }, + { + "epoch": 3.52, + "learning_rate": 1.2587877110434542e-05, + "loss": 0.1264, + "step": 35985 + }, + { + "epoch": 3.52, + "learning_rate": 1.2583725435925824e-05, + "loss": 0.0947, + "step": 35990 + }, + { + "epoch": 3.52, + "learning_rate": 1.2579573761417105e-05, + "loss": 0.0941, + "step": 35995 + }, + { + "epoch": 3.52, + "learning_rate": 1.2575422086908388e-05, + "loss": 0.1325, + "step": 36000 + }, + { + "epoch": 3.52, + "eval_cer": 0.056739064584677354, + "eval_loss": 0.23321078717708588, + "eval_runtime": 272.1507, + "eval_samples_per_second": 60.15, + "eval_steps_per_second": 1.672, + "eval_wer": 0.14581796099070804, + "step": 36000 + }, + { + "epoch": 3.52, + "learning_rate": 1.2571270412399668e-05, + "loss": 0.1067, + "step": 36005 + }, + { + "epoch": 3.52, + "learning_rate": 1.2567118737890949e-05, + "loss": 0.0987, + "step": 36010 + }, + { + "epoch": 3.52, + "learning_rate": 1.2562967063382232e-05, + "loss": 0.1014, + "step": 36015 + }, + { + "epoch": 3.52, + "learning_rate": 1.2558815388873512e-05, + "loss": 0.1156, + "step": 36020 + }, + { + "epoch": 3.52, + "learning_rate": 1.2554663714364795e-05, + "loss": 0.0932, + "step": 36025 + }, + { + "epoch": 3.52, + "learning_rate": 1.2550512039856076e-05, + "loss": 0.0914, + "step": 36030 + }, + { + "epoch": 3.52, + "learning_rate": 1.2546360365347356e-05, + "loss": 0.1285, + "step": 36035 + }, + { + "epoch": 3.52, + "learning_rate": 1.2542208690838639e-05, + "loss": 0.0971, + "step": 36040 + }, + { + "epoch": 3.52, + "learning_rate": 1.2538057016329921e-05, + "loss": 0.0981, + "step": 36045 + }, + { + "epoch": 3.53, + "learning_rate": 1.2533905341821202e-05, + "loss": 0.1144, + "step": 36050 + }, + { + "epoch": 3.53, + "learning_rate": 1.2529753667312483e-05, + "loss": 0.1043, + "step": 36055 + }, + { + "epoch": 3.53, + "learning_rate": 1.2525601992803764e-05, + "loss": 0.097, + "step": 36060 + }, + { + "epoch": 3.53, + "learning_rate": 1.2521450318295046e-05, + "loss": 0.1174, + "step": 36065 + }, + { + "epoch": 3.53, + "learning_rate": 1.2517298643786328e-05, + "loss": 0.1081, + "step": 36070 + }, + { + "epoch": 3.53, + "learning_rate": 1.251314696927761e-05, + "loss": 0.1003, + "step": 36075 + }, + { + "epoch": 3.53, + "learning_rate": 1.250899529476889e-05, + "loss": 0.1068, + "step": 36080 + }, + { + "epoch": 3.53, + "learning_rate": 1.250484362026017e-05, + "loss": 0.1202, + "step": 36085 + }, + { + "epoch": 3.53, + "learning_rate": 1.2500691945751453e-05, + "loss": 0.0941, + "step": 36090 + }, + { + "epoch": 3.53, + "learning_rate": 1.2496540271242736e-05, + "loss": 0.0845, + "step": 36095 + }, + { + "epoch": 3.53, + "learning_rate": 1.2492388596734016e-05, + "loss": 0.1118, + "step": 36100 + }, + { + "epoch": 3.53, + "learning_rate": 1.2488236922225297e-05, + "loss": 0.0894, + "step": 36105 + }, + { + "epoch": 3.53, + "learning_rate": 1.248408524771658e-05, + "loss": 0.1033, + "step": 36110 + }, + { + "epoch": 3.53, + "learning_rate": 1.247993357320786e-05, + "loss": 0.109, + "step": 36115 + }, + { + "epoch": 3.53, + "learning_rate": 1.2475781898699143e-05, + "loss": 0.112, + "step": 36120 + }, + { + "epoch": 3.53, + "learning_rate": 1.2471630224190424e-05, + "loss": 0.0935, + "step": 36125 + }, + { + "epoch": 3.53, + "learning_rate": 1.2467478549681704e-05, + "loss": 0.0992, + "step": 36130 + }, + { + "epoch": 3.53, + "learning_rate": 1.2463326875172987e-05, + "loss": 0.1085, + "step": 36135 + }, + { + "epoch": 3.53, + "learning_rate": 1.2459175200664268e-05, + "loss": 0.0921, + "step": 36140 + }, + { + "epoch": 3.53, + "learning_rate": 1.245502352615555e-05, + "loss": 0.0994, + "step": 36145 + }, + { + "epoch": 3.53, + "learning_rate": 1.2450871851646831e-05, + "loss": 0.127, + "step": 36150 + }, + { + "epoch": 3.54, + "learning_rate": 1.2446720177138113e-05, + "loss": 0.0993, + "step": 36155 + }, + { + "epoch": 3.54, + "learning_rate": 1.2442568502629394e-05, + "loss": 0.0887, + "step": 36160 + }, + { + "epoch": 3.54, + "learning_rate": 1.2438416828120675e-05, + "loss": 0.1101, + "step": 36165 + }, + { + "epoch": 3.54, + "learning_rate": 1.2434265153611957e-05, + "loss": 0.0879, + "step": 36170 + }, + { + "epoch": 3.54, + "learning_rate": 1.2430113479103238e-05, + "loss": 0.0921, + "step": 36175 + }, + { + "epoch": 3.54, + "learning_rate": 1.242596180459452e-05, + "loss": 0.1032, + "step": 36180 + }, + { + "epoch": 3.54, + "learning_rate": 1.2421810130085801e-05, + "loss": 0.1296, + "step": 36185 + }, + { + "epoch": 3.54, + "learning_rate": 1.2417658455577082e-05, + "loss": 0.0893, + "step": 36190 + }, + { + "epoch": 3.54, + "learning_rate": 1.2413506781068365e-05, + "loss": 0.1057, + "step": 36195 + }, + { + "epoch": 3.54, + "learning_rate": 1.2409355106559647e-05, + "loss": 0.1175, + "step": 36200 + }, + { + "epoch": 3.54, + "learning_rate": 1.2405203432050928e-05, + "loss": 0.107, + "step": 36205 + }, + { + "epoch": 3.54, + "learning_rate": 1.2401051757542209e-05, + "loss": 0.0892, + "step": 36210 + }, + { + "epoch": 3.54, + "learning_rate": 1.239690008303349e-05, + "loss": 0.1273, + "step": 36215 + }, + { + "epoch": 3.54, + "learning_rate": 1.2392748408524774e-05, + "loss": 0.0958, + "step": 36220 + }, + { + "epoch": 3.54, + "learning_rate": 1.2388596734016054e-05, + "loss": 0.0987, + "step": 36225 + }, + { + "epoch": 3.54, + "learning_rate": 1.2384445059507335e-05, + "loss": 0.1003, + "step": 36230 + }, + { + "epoch": 3.54, + "learning_rate": 1.2380293384998616e-05, + "loss": 0.1166, + "step": 36235 + }, + { + "epoch": 3.54, + "learning_rate": 1.2376141710489897e-05, + "loss": 0.0984, + "step": 36240 + }, + { + "epoch": 3.54, + "learning_rate": 1.237199003598118e-05, + "loss": 0.1031, + "step": 36245 + }, + { + "epoch": 3.54, + "learning_rate": 1.2367838361472462e-05, + "loss": 0.1197, + "step": 36250 + }, + { + "epoch": 3.55, + "learning_rate": 1.2363686686963742e-05, + "loss": 0.0957, + "step": 36255 + }, + { + "epoch": 3.55, + "learning_rate": 1.2359535012455023e-05, + "loss": 0.0865, + "step": 36260 + }, + { + "epoch": 3.55, + "learning_rate": 1.2355383337946306e-05, + "loss": 0.1081, + "step": 36265 + }, + { + "epoch": 3.55, + "learning_rate": 1.2351231663437586e-05, + "loss": 0.1006, + "step": 36270 + }, + { + "epoch": 3.55, + "learning_rate": 1.2347079988928869e-05, + "loss": 0.1044, + "step": 36275 + }, + { + "epoch": 3.55, + "learning_rate": 1.234292831442015e-05, + "loss": 0.118, + "step": 36280 + }, + { + "epoch": 3.55, + "learning_rate": 1.233877663991143e-05, + "loss": 0.1114, + "step": 36285 + }, + { + "epoch": 3.55, + "learning_rate": 1.2334624965402713e-05, + "loss": 0.1005, + "step": 36290 + }, + { + "epoch": 3.55, + "learning_rate": 1.2330473290893994e-05, + "loss": 0.1105, + "step": 36295 + }, + { + "epoch": 3.55, + "learning_rate": 1.2326321616385276e-05, + "loss": 0.1199, + "step": 36300 + }, + { + "epoch": 3.55, + "learning_rate": 1.2322169941876557e-05, + "loss": 0.1147, + "step": 36305 + }, + { + "epoch": 3.55, + "learning_rate": 1.231801826736784e-05, + "loss": 0.0967, + "step": 36310 + }, + { + "epoch": 3.55, + "learning_rate": 1.231386659285912e-05, + "loss": 0.1099, + "step": 36315 + }, + { + "epoch": 3.55, + "learning_rate": 1.23097149183504e-05, + "loss": 0.0955, + "step": 36320 + }, + { + "epoch": 3.55, + "learning_rate": 1.2305563243841683e-05, + "loss": 0.0974, + "step": 36325 + }, + { + "epoch": 3.55, + "learning_rate": 1.2301411569332966e-05, + "loss": 0.1218, + "step": 36330 + }, + { + "epoch": 3.55, + "learning_rate": 1.2297259894824246e-05, + "loss": 0.1115, + "step": 36335 + }, + { + "epoch": 3.55, + "learning_rate": 1.2293108220315527e-05, + "loss": 0.0862, + "step": 36340 + }, + { + "epoch": 3.55, + "learning_rate": 1.2288956545806808e-05, + "loss": 0.0902, + "step": 36345 + }, + { + "epoch": 3.55, + "learning_rate": 1.228480487129809e-05, + "loss": 0.1055, + "step": 36350 + }, + { + "epoch": 3.55, + "learning_rate": 1.2280653196789373e-05, + "loss": 0.1071, + "step": 36355 + }, + { + "epoch": 3.56, + "learning_rate": 1.2276501522280654e-05, + "loss": 0.0873, + "step": 36360 + }, + { + "epoch": 3.56, + "learning_rate": 1.2272349847771934e-05, + "loss": 0.1063, + "step": 36365 + }, + { + "epoch": 3.56, + "learning_rate": 1.2268198173263215e-05, + "loss": 0.1053, + "step": 36370 + }, + { + "epoch": 3.56, + "learning_rate": 1.22640464987545e-05, + "loss": 0.0758, + "step": 36375 + }, + { + "epoch": 3.56, + "learning_rate": 1.225989482424578e-05, + "loss": 0.0853, + "step": 36380 + }, + { + "epoch": 3.56, + "learning_rate": 1.2255743149737061e-05, + "loss": 0.1173, + "step": 36385 + }, + { + "epoch": 3.56, + "learning_rate": 1.2251591475228342e-05, + "loss": 0.0894, + "step": 36390 + }, + { + "epoch": 3.56, + "learning_rate": 1.2247439800719622e-05, + "loss": 0.1018, + "step": 36395 + }, + { + "epoch": 3.56, + "learning_rate": 1.2243288126210907e-05, + "loss": 0.109, + "step": 36400 + }, + { + "epoch": 3.56, + "learning_rate": 1.2239136451702187e-05, + "loss": 0.0914, + "step": 36405 + }, + { + "epoch": 3.56, + "learning_rate": 1.2234984777193468e-05, + "loss": 0.0897, + "step": 36410 + }, + { + "epoch": 3.56, + "learning_rate": 1.2230833102684749e-05, + "loss": 0.1267, + "step": 36415 + }, + { + "epoch": 3.56, + "learning_rate": 1.2226681428176031e-05, + "loss": 0.1109, + "step": 36420 + }, + { + "epoch": 3.56, + "learning_rate": 1.2222529753667314e-05, + "loss": 0.0965, + "step": 36425 + }, + { + "epoch": 3.56, + "learning_rate": 1.2218378079158595e-05, + "loss": 0.0969, + "step": 36430 + }, + { + "epoch": 3.56, + "learning_rate": 1.2214226404649875e-05, + "loss": 0.1128, + "step": 36435 + }, + { + "epoch": 3.56, + "learning_rate": 1.2210074730141158e-05, + "loss": 0.0983, + "step": 36440 + }, + { + "epoch": 3.56, + "learning_rate": 1.2205923055632439e-05, + "loss": 0.0976, + "step": 36445 + }, + { + "epoch": 3.56, + "learning_rate": 1.2201771381123721e-05, + "loss": 0.1177, + "step": 36450 + }, + { + "epoch": 3.56, + "learning_rate": 1.2197619706615002e-05, + "loss": 0.1086, + "step": 36455 + }, + { + "epoch": 3.57, + "learning_rate": 1.2193468032106283e-05, + "loss": 0.0981, + "step": 36460 + }, + { + "epoch": 3.57, + "learning_rate": 1.2189316357597565e-05, + "loss": 0.1249, + "step": 36465 + }, + { + "epoch": 3.57, + "learning_rate": 1.2185164683088846e-05, + "loss": 0.0964, + "step": 36470 + }, + { + "epoch": 3.57, + "learning_rate": 1.2181013008580127e-05, + "loss": 0.0992, + "step": 36475 + }, + { + "epoch": 3.57, + "learning_rate": 1.2176861334071409e-05, + "loss": 0.0856, + "step": 36480 + }, + { + "epoch": 3.57, + "learning_rate": 1.2172709659562692e-05, + "loss": 0.1179, + "step": 36485 + }, + { + "epoch": 3.57, + "learning_rate": 1.2168557985053972e-05, + "loss": 0.0879, + "step": 36490 + }, + { + "epoch": 3.57, + "learning_rate": 1.2164406310545253e-05, + "loss": 0.0894, + "step": 36495 + }, + { + "epoch": 3.57, + "learning_rate": 1.2160254636036534e-05, + "loss": 0.1208, + "step": 36500 + }, + { + "epoch": 3.57, + "eval_cer": 0.05783509183274717, + "eval_loss": 0.23720672726631165, + "eval_runtime": 275.0053, + "eval_samples_per_second": 59.526, + "eval_steps_per_second": 1.655, + "eval_wer": 0.1469215047374023, + "step": 36500 + }, + { + "epoch": 3.57, + "learning_rate": 1.2156102961527816e-05, + "loss": 0.0942, + "step": 36505 + }, + { + "epoch": 3.57, + "learning_rate": 1.2151951287019099e-05, + "loss": 0.1037, + "step": 36510 + }, + { + "epoch": 3.57, + "learning_rate": 1.2148629947412123e-05, + "loss": 0.1292, + "step": 36515 + }, + { + "epoch": 3.57, + "learning_rate": 1.2144478272903404e-05, + "loss": 0.1093, + "step": 36520 + }, + { + "epoch": 3.57, + "learning_rate": 1.2140326598394687e-05, + "loss": 0.0944, + "step": 36525 + }, + { + "epoch": 3.57, + "learning_rate": 1.2136174923885967e-05, + "loss": 0.1259, + "step": 36530 + }, + { + "epoch": 3.57, + "learning_rate": 1.213202324937725e-05, + "loss": 0.1133, + "step": 36535 + }, + { + "epoch": 3.57, + "learning_rate": 1.212787157486853e-05, + "loss": 0.1011, + "step": 36540 + }, + { + "epoch": 3.57, + "learning_rate": 1.2123719900359811e-05, + "loss": 0.1017, + "step": 36545 + }, + { + "epoch": 3.57, + "learning_rate": 1.2119568225851094e-05, + "loss": 0.1346, + "step": 36550 + }, + { + "epoch": 3.57, + "learning_rate": 1.2115416551342375e-05, + "loss": 0.1018, + "step": 36555 + }, + { + "epoch": 3.57, + "learning_rate": 1.2111264876833657e-05, + "loss": 0.1054, + "step": 36560 + }, + { + "epoch": 3.58, + "learning_rate": 1.2107113202324938e-05, + "loss": 0.1149, + "step": 36565 + }, + { + "epoch": 3.58, + "learning_rate": 1.2102961527816219e-05, + "loss": 0.106, + "step": 36570 + }, + { + "epoch": 3.58, + "learning_rate": 1.2098809853307501e-05, + "loss": 0.1075, + "step": 36575 + }, + { + "epoch": 3.58, + "learning_rate": 1.2094658178798784e-05, + "loss": 0.1026, + "step": 36580 + }, + { + "epoch": 3.58, + "learning_rate": 1.2090506504290064e-05, + "loss": 0.1168, + "step": 36585 + }, + { + "epoch": 3.58, + "learning_rate": 1.2086354829781345e-05, + "loss": 0.1102, + "step": 36590 + }, + { + "epoch": 3.58, + "learning_rate": 1.2082203155272626e-05, + "loss": 0.0876, + "step": 36595 + }, + { + "epoch": 3.58, + "learning_rate": 1.207805148076391e-05, + "loss": 0.1218, + "step": 36600 + }, + { + "epoch": 3.58, + "learning_rate": 1.207389980625519e-05, + "loss": 0.0997, + "step": 36605 + }, + { + "epoch": 3.58, + "learning_rate": 1.2069748131746472e-05, + "loss": 0.1029, + "step": 36610 + }, + { + "epoch": 3.58, + "learning_rate": 1.2065596457237752e-05, + "loss": 0.1194, + "step": 36615 + }, + { + "epoch": 3.58, + "learning_rate": 1.2061444782729033e-05, + "loss": 0.0952, + "step": 36620 + }, + { + "epoch": 3.58, + "learning_rate": 1.2057293108220317e-05, + "loss": 0.0906, + "step": 36625 + }, + { + "epoch": 3.58, + "learning_rate": 1.2053141433711598e-05, + "loss": 0.0986, + "step": 36630 + }, + { + "epoch": 3.58, + "learning_rate": 1.2048989759202879e-05, + "loss": 0.1016, + "step": 36635 + }, + { + "epoch": 3.58, + "learning_rate": 1.204483808469416e-05, + "loss": 0.0986, + "step": 36640 + }, + { + "epoch": 3.58, + "learning_rate": 1.2040686410185442e-05, + "loss": 0.0884, + "step": 36645 + }, + { + "epoch": 3.58, + "learning_rate": 1.2036534735676723e-05, + "loss": 0.1183, + "step": 36650 + }, + { + "epoch": 3.58, + "learning_rate": 1.2032383061168005e-05, + "loss": 0.1004, + "step": 36655 + }, + { + "epoch": 3.58, + "learning_rate": 1.2028231386659286e-05, + "loss": 0.0916, + "step": 36660 + }, + { + "epoch": 3.59, + "learning_rate": 1.2024079712150567e-05, + "loss": 0.1126, + "step": 36665 + }, + { + "epoch": 3.59, + "learning_rate": 1.201992803764185e-05, + "loss": 0.0979, + "step": 36670 + }, + { + "epoch": 3.59, + "learning_rate": 1.201577636313313e-05, + "loss": 0.0916, + "step": 36675 + }, + { + "epoch": 3.59, + "learning_rate": 1.2011624688624412e-05, + "loss": 0.097, + "step": 36680 + }, + { + "epoch": 3.59, + "learning_rate": 1.2007473014115693e-05, + "loss": 0.1193, + "step": 36685 + }, + { + "epoch": 3.59, + "learning_rate": 1.2003321339606976e-05, + "loss": 0.0849, + "step": 36690 + }, + { + "epoch": 3.59, + "learning_rate": 1.1999169665098256e-05, + "loss": 0.0978, + "step": 36695 + }, + { + "epoch": 3.59, + "learning_rate": 1.1995017990589537e-05, + "loss": 0.1278, + "step": 36700 + }, + { + "epoch": 3.59, + "learning_rate": 1.199086631608082e-05, + "loss": 0.099, + "step": 36705 + }, + { + "epoch": 3.59, + "learning_rate": 1.1986714641572102e-05, + "loss": 0.1045, + "step": 36710 + }, + { + "epoch": 3.59, + "learning_rate": 1.1982562967063383e-05, + "loss": 0.1032, + "step": 36715 + }, + { + "epoch": 3.59, + "learning_rate": 1.1978411292554664e-05, + "loss": 0.112, + "step": 36720 + }, + { + "epoch": 3.59, + "learning_rate": 1.1974259618045944e-05, + "loss": 0.1198, + "step": 36725 + }, + { + "epoch": 3.59, + "learning_rate": 1.1970107943537227e-05, + "loss": 0.103, + "step": 36730 + }, + { + "epoch": 3.59, + "learning_rate": 1.196595626902851e-05, + "loss": 0.1223, + "step": 36735 + }, + { + "epoch": 3.59, + "learning_rate": 1.196180459451979e-05, + "loss": 0.1061, + "step": 36740 + }, + { + "epoch": 3.59, + "learning_rate": 1.1957652920011071e-05, + "loss": 0.095, + "step": 36745 + }, + { + "epoch": 3.59, + "learning_rate": 1.1953501245502352e-05, + "loss": 0.1125, + "step": 36750 + }, + { + "epoch": 3.59, + "learning_rate": 1.1949349570993636e-05, + "loss": 0.1037, + "step": 36755 + }, + { + "epoch": 3.59, + "learning_rate": 1.1945197896484917e-05, + "loss": 0.0891, + "step": 36760 + }, + { + "epoch": 3.6, + "learning_rate": 1.1941046221976197e-05, + "loss": 0.1056, + "step": 36765 + }, + { + "epoch": 3.6, + "learning_rate": 1.1936894547467478e-05, + "loss": 0.103, + "step": 36770 + }, + { + "epoch": 3.6, + "learning_rate": 1.1932742872958759e-05, + "loss": 0.0944, + "step": 36775 + }, + { + "epoch": 3.6, + "learning_rate": 1.1928591198450043e-05, + "loss": 0.1228, + "step": 36780 + }, + { + "epoch": 3.6, + "learning_rate": 1.1924439523941324e-05, + "loss": 0.1356, + "step": 36785 + }, + { + "epoch": 3.6, + "learning_rate": 1.1920287849432605e-05, + "loss": 0.0968, + "step": 36790 + }, + { + "epoch": 3.6, + "learning_rate": 1.1916136174923885e-05, + "loss": 0.101, + "step": 36795 + }, + { + "epoch": 3.6, + "learning_rate": 1.1911984500415168e-05, + "loss": 0.1338, + "step": 36800 + }, + { + "epoch": 3.6, + "learning_rate": 1.190783282590645e-05, + "loss": 0.105, + "step": 36805 + }, + { + "epoch": 3.6, + "learning_rate": 1.1903681151397731e-05, + "loss": 0.1048, + "step": 36810 + }, + { + "epoch": 3.6, + "learning_rate": 1.1899529476889012e-05, + "loss": 0.1202, + "step": 36815 + }, + { + "epoch": 3.6, + "learning_rate": 1.1895377802380294e-05, + "loss": 0.1082, + "step": 36820 + }, + { + "epoch": 3.6, + "learning_rate": 1.1891226127871575e-05, + "loss": 0.0966, + "step": 36825 + }, + { + "epoch": 3.6, + "learning_rate": 1.1887074453362858e-05, + "loss": 0.1161, + "step": 36830 + }, + { + "epoch": 3.6, + "learning_rate": 1.1882922778854138e-05, + "loss": 0.131, + "step": 36835 + }, + { + "epoch": 3.6, + "learning_rate": 1.1878771104345419e-05, + "loss": 0.0988, + "step": 36840 + }, + { + "epoch": 3.6, + "learning_rate": 1.1874619429836702e-05, + "loss": 0.0948, + "step": 36845 + }, + { + "epoch": 3.6, + "learning_rate": 1.1870467755327982e-05, + "loss": 0.1065, + "step": 36850 + }, + { + "epoch": 3.6, + "learning_rate": 1.1866316080819263e-05, + "loss": 0.0933, + "step": 36855 + }, + { + "epoch": 3.6, + "learning_rate": 1.1862164406310546e-05, + "loss": 0.0981, + "step": 36860 + }, + { + "epoch": 3.6, + "learning_rate": 1.1858012731801828e-05, + "loss": 0.1187, + "step": 36865 + }, + { + "epoch": 3.61, + "learning_rate": 1.1853861057293109e-05, + "loss": 0.0998, + "step": 36870 + }, + { + "epoch": 3.61, + "learning_rate": 1.184970938278439e-05, + "loss": 0.0972, + "step": 36875 + }, + { + "epoch": 3.61, + "learning_rate": 1.184555770827567e-05, + "loss": 0.1059, + "step": 36880 + }, + { + "epoch": 3.61, + "learning_rate": 1.1841406033766953e-05, + "loss": 0.1112, + "step": 36885 + }, + { + "epoch": 3.61, + "learning_rate": 1.1837254359258235e-05, + "loss": 0.0888, + "step": 36890 + }, + { + "epoch": 3.61, + "learning_rate": 1.1833102684749516e-05, + "loss": 0.091, + "step": 36895 + }, + { + "epoch": 3.61, + "learning_rate": 1.1828951010240797e-05, + "loss": 0.1138, + "step": 36900 + }, + { + "epoch": 3.61, + "learning_rate": 1.1824799335732078e-05, + "loss": 0.0945, + "step": 36905 + }, + { + "epoch": 3.61, + "learning_rate": 1.1820647661223362e-05, + "loss": 0.0972, + "step": 36910 + }, + { + "epoch": 3.61, + "learning_rate": 1.1816495986714642e-05, + "loss": 0.1322, + "step": 36915 + }, + { + "epoch": 3.61, + "learning_rate": 1.1812344312205923e-05, + "loss": 0.1118, + "step": 36920 + }, + { + "epoch": 3.61, + "learning_rate": 1.1808192637697204e-05, + "loss": 0.1125, + "step": 36925 + }, + { + "epoch": 3.61, + "learning_rate": 1.1804040963188486e-05, + "loss": 0.1071, + "step": 36930 + }, + { + "epoch": 3.61, + "learning_rate": 1.1799889288679769e-05, + "loss": 0.1123, + "step": 36935 + }, + { + "epoch": 3.61, + "learning_rate": 1.179573761417105e-05, + "loss": 0.0973, + "step": 36940 + }, + { + "epoch": 3.61, + "learning_rate": 1.179158593966233e-05, + "loss": 0.0978, + "step": 36945 + }, + { + "epoch": 3.61, + "learning_rate": 1.1787434265153611e-05, + "loss": 0.1218, + "step": 36950 + }, + { + "epoch": 3.61, + "learning_rate": 1.1783282590644894e-05, + "loss": 0.1076, + "step": 36955 + }, + { + "epoch": 3.61, + "learning_rate": 1.1779130916136176e-05, + "loss": 0.1041, + "step": 36960 + }, + { + "epoch": 3.61, + "learning_rate": 1.1774979241627457e-05, + "loss": 0.1133, + "step": 36965 + }, + { + "epoch": 3.62, + "learning_rate": 1.1770827567118738e-05, + "loss": 0.1139, + "step": 36970 + }, + { + "epoch": 3.62, + "learning_rate": 1.176667589261002e-05, + "loss": 0.0988, + "step": 36975 + }, + { + "epoch": 3.62, + "learning_rate": 1.1762524218101301e-05, + "loss": 0.0883, + "step": 36980 + }, + { + "epoch": 3.62, + "learning_rate": 1.1758372543592583e-05, + "loss": 0.1152, + "step": 36985 + }, + { + "epoch": 3.62, + "learning_rate": 1.1754220869083864e-05, + "loss": 0.0892, + "step": 36990 + }, + { + "epoch": 3.62, + "learning_rate": 1.1750069194575145e-05, + "loss": 0.1086, + "step": 36995 + }, + { + "epoch": 3.62, + "learning_rate": 1.1745917520066427e-05, + "loss": 0.1309, + "step": 37000 + }, + { + "epoch": 3.62, + "eval_cer": 0.05695410790550118, + "eval_loss": 0.2353515326976776, + "eval_runtime": 273.7045, + "eval_samples_per_second": 59.809, + "eval_steps_per_second": 1.662, + "eval_wer": 0.14545881953468326, + "step": 37000 + }, + { + "epoch": 3.62, + "learning_rate": 1.1741765845557708e-05, + "loss": 0.1098, + "step": 37005 + }, + { + "epoch": 3.62, + "learning_rate": 1.173761417104899e-05, + "loss": 0.0905, + "step": 37010 + }, + { + "epoch": 3.62, + "learning_rate": 1.1733462496540271e-05, + "loss": 0.1177, + "step": 37015 + }, + { + "epoch": 3.62, + "learning_rate": 1.1729310822031554e-05, + "loss": 0.1028, + "step": 37020 + }, + { + "epoch": 3.62, + "learning_rate": 1.1725159147522835e-05, + "loss": 0.0903, + "step": 37025 + }, + { + "epoch": 3.62, + "learning_rate": 1.1721007473014115e-05, + "loss": 0.0944, + "step": 37030 + }, + { + "epoch": 3.62, + "learning_rate": 1.1716855798505398e-05, + "loss": 0.1172, + "step": 37035 + }, + { + "epoch": 3.62, + "learning_rate": 1.171270412399668e-05, + "loss": 0.1123, + "step": 37040 + }, + { + "epoch": 3.62, + "learning_rate": 1.1708552449487961e-05, + "loss": 0.0848, + "step": 37045 + }, + { + "epoch": 3.62, + "learning_rate": 1.1704400774979242e-05, + "loss": 0.1335, + "step": 37050 + }, + { + "epoch": 3.62, + "learning_rate": 1.1700249100470523e-05, + "loss": 0.1086, + "step": 37055 + }, + { + "epoch": 3.62, + "learning_rate": 1.1696097425961803e-05, + "loss": 0.0903, + "step": 37060 + }, + { + "epoch": 3.62, + "learning_rate": 1.1691945751453088e-05, + "loss": 0.1186, + "step": 37065 + }, + { + "epoch": 3.62, + "learning_rate": 1.1687794076944368e-05, + "loss": 0.1121, + "step": 37070 + }, + { + "epoch": 3.63, + "learning_rate": 1.1683642402435649e-05, + "loss": 0.1059, + "step": 37075 + }, + { + "epoch": 3.63, + "learning_rate": 1.167949072792693e-05, + "loss": 0.1181, + "step": 37080 + }, + { + "epoch": 3.63, + "learning_rate": 1.1675339053418212e-05, + "loss": 0.1152, + "step": 37085 + }, + { + "epoch": 3.63, + "learning_rate": 1.1671187378909495e-05, + "loss": 0.106, + "step": 37090 + }, + { + "epoch": 3.63, + "learning_rate": 1.1667035704400776e-05, + "loss": 0.107, + "step": 37095 + }, + { + "epoch": 3.63, + "learning_rate": 1.1662884029892056e-05, + "loss": 0.1186, + "step": 37100 + }, + { + "epoch": 3.63, + "learning_rate": 1.1658732355383337e-05, + "loss": 0.0948, + "step": 37105 + }, + { + "epoch": 3.63, + "learning_rate": 1.165458068087462e-05, + "loss": 0.0993, + "step": 37110 + }, + { + "epoch": 3.63, + "learning_rate": 1.1650429006365902e-05, + "loss": 0.1223, + "step": 37115 + }, + { + "epoch": 3.63, + "learning_rate": 1.1646277331857183e-05, + "loss": 0.108, + "step": 37120 + }, + { + "epoch": 3.63, + "learning_rate": 1.1642125657348464e-05, + "loss": 0.0919, + "step": 37125 + }, + { + "epoch": 3.63, + "learning_rate": 1.1637973982839746e-05, + "loss": 0.103, + "step": 37130 + }, + { + "epoch": 3.63, + "learning_rate": 1.1633822308331027e-05, + "loss": 0.1157, + "step": 37135 + }, + { + "epoch": 3.63, + "learning_rate": 1.162967063382231e-05, + "loss": 0.1004, + "step": 37140 + }, + { + "epoch": 3.63, + "learning_rate": 1.162551895931359e-05, + "loss": 0.0921, + "step": 37145 + }, + { + "epoch": 3.63, + "learning_rate": 1.162136728480487e-05, + "loss": 0.1238, + "step": 37150 + }, + { + "epoch": 3.63, + "learning_rate": 1.1617215610296153e-05, + "loss": 0.0965, + "step": 37155 + }, + { + "epoch": 3.63, + "learning_rate": 1.1613063935787434e-05, + "loss": 0.0925, + "step": 37160 + }, + { + "epoch": 3.63, + "learning_rate": 1.1608912261278716e-05, + "loss": 0.1314, + "step": 37165 + }, + { + "epoch": 3.63, + "learning_rate": 1.1604760586769997e-05, + "loss": 0.1164, + "step": 37170 + }, + { + "epoch": 3.64, + "learning_rate": 1.160060891226128e-05, + "loss": 0.1023, + "step": 37175 + }, + { + "epoch": 3.64, + "learning_rate": 1.159645723775256e-05, + "loss": 0.0933, + "step": 37180 + }, + { + "epoch": 3.64, + "learning_rate": 1.1592305563243841e-05, + "loss": 0.1088, + "step": 37185 + }, + { + "epoch": 3.64, + "learning_rate": 1.1588153888735124e-05, + "loss": 0.1041, + "step": 37190 + }, + { + "epoch": 3.64, + "learning_rate": 1.1584002214226406e-05, + "loss": 0.1096, + "step": 37195 + }, + { + "epoch": 3.64, + "learning_rate": 1.1579850539717687e-05, + "loss": 0.1124, + "step": 37200 + }, + { + "epoch": 3.64, + "learning_rate": 1.1575698865208968e-05, + "loss": 0.1006, + "step": 37205 + }, + { + "epoch": 3.64, + "learning_rate": 1.1571547190700248e-05, + "loss": 0.0901, + "step": 37210 + }, + { + "epoch": 3.64, + "learning_rate": 1.1567395516191531e-05, + "loss": 0.1087, + "step": 37215 + }, + { + "epoch": 3.64, + "learning_rate": 1.1563243841682813e-05, + "loss": 0.1114, + "step": 37220 + }, + { + "epoch": 3.64, + "learning_rate": 1.1559092167174094e-05, + "loss": 0.0905, + "step": 37225 + }, + { + "epoch": 3.64, + "learning_rate": 1.1554940492665375e-05, + "loss": 0.082, + "step": 37230 + }, + { + "epoch": 3.64, + "learning_rate": 1.1550788818156656e-05, + "loss": 0.1161, + "step": 37235 + }, + { + "epoch": 3.64, + "learning_rate": 1.154663714364794e-05, + "loss": 0.1026, + "step": 37240 + }, + { + "epoch": 3.64, + "learning_rate": 1.154248546913922e-05, + "loss": 0.1088, + "step": 37245 + }, + { + "epoch": 3.64, + "learning_rate": 1.1538333794630501e-05, + "loss": 0.121, + "step": 37250 + }, + { + "epoch": 3.64, + "learning_rate": 1.1534182120121782e-05, + "loss": 0.1023, + "step": 37255 + }, + { + "epoch": 3.64, + "learning_rate": 1.1530030445613063e-05, + "loss": 0.1086, + "step": 37260 + }, + { + "epoch": 3.64, + "learning_rate": 1.1525878771104345e-05, + "loss": 0.1155, + "step": 37265 + }, + { + "epoch": 3.64, + "learning_rate": 1.1521727096595628e-05, + "loss": 0.1115, + "step": 37270 + }, + { + "epoch": 3.64, + "learning_rate": 1.1517575422086909e-05, + "loss": 0.1196, + "step": 37275 + }, + { + "epoch": 3.65, + "learning_rate": 1.151342374757819e-05, + "loss": 0.119, + "step": 37280 + }, + { + "epoch": 3.65, + "learning_rate": 1.1509272073069472e-05, + "loss": 0.1186, + "step": 37285 + }, + { + "epoch": 3.65, + "learning_rate": 1.1505120398560753e-05, + "loss": 0.1088, + "step": 37290 + }, + { + "epoch": 3.65, + "learning_rate": 1.1500968724052035e-05, + "loss": 0.0911, + "step": 37295 + }, + { + "epoch": 3.65, + "learning_rate": 1.1496817049543316e-05, + "loss": 0.1177, + "step": 37300 + }, + { + "epoch": 3.65, + "learning_rate": 1.1492665375034598e-05, + "loss": 0.1017, + "step": 37305 + }, + { + "epoch": 3.65, + "learning_rate": 1.1488513700525879e-05, + "loss": 0.0968, + "step": 37310 + }, + { + "epoch": 3.65, + "learning_rate": 1.148436202601716e-05, + "loss": 0.1135, + "step": 37315 + }, + { + "epoch": 3.65, + "learning_rate": 1.1480210351508442e-05, + "loss": 0.1198, + "step": 37320 + }, + { + "epoch": 3.65, + "learning_rate": 1.1476058676999723e-05, + "loss": 0.0948, + "step": 37325 + }, + { + "epoch": 3.65, + "learning_rate": 1.1471907002491006e-05, + "loss": 0.1034, + "step": 37330 + }, + { + "epoch": 3.65, + "learning_rate": 1.1467755327982286e-05, + "loss": 0.1092, + "step": 37335 + }, + { + "epoch": 3.65, + "learning_rate": 1.1463603653473567e-05, + "loss": 0.0882, + "step": 37340 + }, + { + "epoch": 3.65, + "learning_rate": 1.145945197896485e-05, + "loss": 0.0862, + "step": 37345 + }, + { + "epoch": 3.65, + "learning_rate": 1.1455300304456132e-05, + "loss": 0.1083, + "step": 37350 + }, + { + "epoch": 3.65, + "learning_rate": 1.1451148629947413e-05, + "loss": 0.099, + "step": 37355 + }, + { + "epoch": 3.65, + "learning_rate": 1.1446996955438694e-05, + "loss": 0.091, + "step": 37360 + }, + { + "epoch": 3.65, + "learning_rate": 1.1442845280929974e-05, + "loss": 0.1209, + "step": 37365 + }, + { + "epoch": 3.65, + "learning_rate": 1.1438693606421257e-05, + "loss": 0.1232, + "step": 37370 + }, + { + "epoch": 3.65, + "learning_rate": 1.143454193191254e-05, + "loss": 0.0995, + "step": 37375 + }, + { + "epoch": 3.66, + "learning_rate": 1.143039025740382e-05, + "loss": 0.1011, + "step": 37380 + }, + { + "epoch": 3.66, + "learning_rate": 1.14262385828951e-05, + "loss": 0.1071, + "step": 37385 + }, + { + "epoch": 3.66, + "learning_rate": 1.1422086908386382e-05, + "loss": 0.0854, + "step": 37390 + }, + { + "epoch": 3.66, + "learning_rate": 1.1417935233877666e-05, + "loss": 0.0908, + "step": 37395 + }, + { + "epoch": 3.66, + "learning_rate": 1.1413783559368946e-05, + "loss": 0.1179, + "step": 37400 + }, + { + "epoch": 3.66, + "learning_rate": 1.1409631884860227e-05, + "loss": 0.1024, + "step": 37405 + }, + { + "epoch": 3.66, + "learning_rate": 1.1405480210351508e-05, + "loss": 0.1035, + "step": 37410 + }, + { + "epoch": 3.66, + "learning_rate": 1.140132853584279e-05, + "loss": 0.1126, + "step": 37415 + }, + { + "epoch": 3.66, + "learning_rate": 1.1397176861334073e-05, + "loss": 0.1065, + "step": 37420 + }, + { + "epoch": 3.66, + "learning_rate": 1.1393025186825354e-05, + "loss": 0.1003, + "step": 37425 + }, + { + "epoch": 3.66, + "learning_rate": 1.1388873512316634e-05, + "loss": 0.0974, + "step": 37430 + }, + { + "epoch": 3.66, + "learning_rate": 1.1384721837807915e-05, + "loss": 0.1264, + "step": 37435 + }, + { + "epoch": 3.66, + "learning_rate": 1.1380570163299198e-05, + "loss": 0.0973, + "step": 37440 + }, + { + "epoch": 3.66, + "learning_rate": 1.137641848879048e-05, + "loss": 0.0844, + "step": 37445 + }, + { + "epoch": 3.66, + "learning_rate": 1.1372266814281761e-05, + "loss": 0.1139, + "step": 37450 + }, + { + "epoch": 3.66, + "learning_rate": 1.1368115139773042e-05, + "loss": 0.097, + "step": 37455 + }, + { + "epoch": 3.66, + "learning_rate": 1.1363963465264324e-05, + "loss": 0.1032, + "step": 37460 + }, + { + "epoch": 3.66, + "learning_rate": 1.1359811790755605e-05, + "loss": 0.1115, + "step": 37465 + }, + { + "epoch": 3.66, + "learning_rate": 1.1355660116246886e-05, + "loss": 0.1023, + "step": 37470 + }, + { + "epoch": 3.66, + "learning_rate": 1.1351508441738168e-05, + "loss": 0.0948, + "step": 37475 + }, + { + "epoch": 3.66, + "learning_rate": 1.1347356767229449e-05, + "loss": 0.1012, + "step": 37480 + }, + { + "epoch": 3.67, + "learning_rate": 1.1343205092720731e-05, + "loss": 0.1147, + "step": 37485 + }, + { + "epoch": 3.67, + "learning_rate": 1.1339053418212012e-05, + "loss": 0.0929, + "step": 37490 + }, + { + "epoch": 3.67, + "learning_rate": 1.1334901743703293e-05, + "loss": 0.0918, + "step": 37495 + }, + { + "epoch": 3.67, + "learning_rate": 1.1330750069194575e-05, + "loss": 0.1303, + "step": 37500 + }, + { + "epoch": 3.67, + "eval_cer": 0.05594363552700644, + "eval_loss": 0.22809739410877228, + "eval_runtime": 274.0616, + "eval_samples_per_second": 59.731, + "eval_steps_per_second": 1.66, + "eval_wer": 0.1434606870702546, + "step": 37500 + }, + { + "epoch": 3.67, + "learning_rate": 1.1326598394685858e-05, + "loss": 0.1031, + "step": 37505 + }, + { + "epoch": 3.67, + "learning_rate": 1.1322446720177139e-05, + "loss": 0.0965, + "step": 37510 + }, + { + "epoch": 3.67, + "learning_rate": 1.131829504566842e-05, + "loss": 0.1163, + "step": 37515 + }, + { + "epoch": 3.67, + "learning_rate": 1.13141433711597e-05, + "loss": 0.1075, + "step": 37520 + }, + { + "epoch": 3.67, + "learning_rate": 1.1309991696650984e-05, + "loss": 0.1006, + "step": 37525 + }, + { + "epoch": 3.67, + "learning_rate": 1.1305840022142265e-05, + "loss": 0.104, + "step": 37530 + }, + { + "epoch": 3.67, + "learning_rate": 1.1301688347633546e-05, + "loss": 0.1154, + "step": 37535 + }, + { + "epoch": 3.67, + "learning_rate": 1.1297536673124827e-05, + "loss": 0.0851, + "step": 37540 + }, + { + "epoch": 3.67, + "learning_rate": 1.1293384998616107e-05, + "loss": 0.0941, + "step": 37545 + }, + { + "epoch": 3.67, + "learning_rate": 1.1289233324107392e-05, + "loss": 0.1189, + "step": 37550 + }, + { + "epoch": 3.67, + "learning_rate": 1.1285081649598672e-05, + "loss": 0.0969, + "step": 37555 + }, + { + "epoch": 3.67, + "learning_rate": 1.1280929975089953e-05, + "loss": 0.0922, + "step": 37560 + }, + { + "epoch": 3.67, + "learning_rate": 1.1276778300581234e-05, + "loss": 0.1091, + "step": 37565 + }, + { + "epoch": 3.67, + "learning_rate": 1.1272626626072516e-05, + "loss": 0.1131, + "step": 37570 + }, + { + "epoch": 3.67, + "learning_rate": 1.1268474951563799e-05, + "loss": 0.0983, + "step": 37575 + }, + { + "epoch": 3.67, + "learning_rate": 1.126432327705508e-05, + "loss": 0.1134, + "step": 37580 + }, + { + "epoch": 3.68, + "learning_rate": 1.126017160254636e-05, + "loss": 0.1143, + "step": 37585 + }, + { + "epoch": 3.68, + "learning_rate": 1.1256019928037641e-05, + "loss": 0.0995, + "step": 37590 + }, + { + "epoch": 3.68, + "learning_rate": 1.1251868253528924e-05, + "loss": 0.0888, + "step": 37595 + }, + { + "epoch": 3.68, + "learning_rate": 1.1247716579020206e-05, + "loss": 0.1207, + "step": 37600 + }, + { + "epoch": 3.68, + "learning_rate": 1.1243564904511487e-05, + "loss": 0.0897, + "step": 37605 + }, + { + "epoch": 3.68, + "learning_rate": 1.1239413230002768e-05, + "loss": 0.1069, + "step": 37610 + }, + { + "epoch": 3.68, + "learning_rate": 1.123526155549405e-05, + "loss": 0.1276, + "step": 37615 + }, + { + "epoch": 3.68, + "learning_rate": 1.123110988098533e-05, + "loss": 0.1184, + "step": 37620 + }, + { + "epoch": 3.68, + "learning_rate": 1.1226958206476613e-05, + "loss": 0.0997, + "step": 37625 + }, + { + "epoch": 3.68, + "learning_rate": 1.1222806531967894e-05, + "loss": 0.0927, + "step": 37630 + }, + { + "epoch": 3.68, + "learning_rate": 1.1218654857459176e-05, + "loss": 0.1162, + "step": 37635 + }, + { + "epoch": 3.68, + "learning_rate": 1.1214503182950457e-05, + "loss": 0.0963, + "step": 37640 + }, + { + "epoch": 3.68, + "learning_rate": 1.1210351508441738e-05, + "loss": 0.1033, + "step": 37645 + }, + { + "epoch": 3.68, + "learning_rate": 1.120619983393302e-05, + "loss": 0.1237, + "step": 37650 + }, + { + "epoch": 3.68, + "learning_rate": 1.1202048159424301e-05, + "loss": 0.0969, + "step": 37655 + }, + { + "epoch": 3.68, + "learning_rate": 1.1197896484915584e-05, + "loss": 0.0884, + "step": 37660 + }, + { + "epoch": 3.68, + "learning_rate": 1.1193744810406864e-05, + "loss": 0.0993, + "step": 37665 + }, + { + "epoch": 3.68, + "learning_rate": 1.1189593135898145e-05, + "loss": 0.0975, + "step": 37670 + }, + { + "epoch": 3.68, + "learning_rate": 1.1185441461389426e-05, + "loss": 0.1025, + "step": 37675 + }, + { + "epoch": 3.68, + "learning_rate": 1.118128978688071e-05, + "loss": 0.1015, + "step": 37680 + }, + { + "epoch": 3.68, + "learning_rate": 1.1177138112371991e-05, + "loss": 0.1204, + "step": 37685 + }, + { + "epoch": 3.69, + "learning_rate": 1.1172986437863272e-05, + "loss": 0.1027, + "step": 37690 + }, + { + "epoch": 3.69, + "learning_rate": 1.1168834763354552e-05, + "loss": 0.1079, + "step": 37695 + }, + { + "epoch": 3.69, + "learning_rate": 1.1164683088845833e-05, + "loss": 0.1248, + "step": 37700 + }, + { + "epoch": 3.69, + "learning_rate": 1.1160531414337117e-05, + "loss": 0.0924, + "step": 37705 + }, + { + "epoch": 3.69, + "learning_rate": 1.1156379739828398e-05, + "loss": 0.1087, + "step": 37710 + }, + { + "epoch": 3.69, + "learning_rate": 1.1152228065319679e-05, + "loss": 0.117, + "step": 37715 + }, + { + "epoch": 3.69, + "learning_rate": 1.114807639081096e-05, + "loss": 0.0941, + "step": 37720 + }, + { + "epoch": 3.69, + "learning_rate": 1.1143924716302242e-05, + "loss": 0.1003, + "step": 37725 + }, + { + "epoch": 3.69, + "learning_rate": 1.1139773041793525e-05, + "loss": 0.0999, + "step": 37730 + }, + { + "epoch": 3.69, + "learning_rate": 1.1135621367284805e-05, + "loss": 0.1153, + "step": 37735 + }, + { + "epoch": 3.69, + "learning_rate": 1.1131469692776086e-05, + "loss": 0.1032, + "step": 37740 + }, + { + "epoch": 3.69, + "learning_rate": 1.1127318018267369e-05, + "loss": 0.0913, + "step": 37745 + }, + { + "epoch": 3.69, + "learning_rate": 1.112316634375865e-05, + "loss": 0.1083, + "step": 37750 + }, + { + "epoch": 3.69, + "learning_rate": 1.1119014669249932e-05, + "loss": 0.088, + "step": 37755 + }, + { + "epoch": 3.69, + "learning_rate": 1.1114862994741213e-05, + "loss": 0.0972, + "step": 37760 + }, + { + "epoch": 3.69, + "learning_rate": 1.1110711320232493e-05, + "loss": 0.0996, + "step": 37765 + }, + { + "epoch": 3.69, + "learning_rate": 1.1106559645723776e-05, + "loss": 0.0998, + "step": 37770 + }, + { + "epoch": 3.69, + "learning_rate": 1.1102407971215057e-05, + "loss": 0.0988, + "step": 37775 + }, + { + "epoch": 3.69, + "learning_rate": 1.1098256296706339e-05, + "loss": 0.1009, + "step": 37780 + }, + { + "epoch": 3.69, + "learning_rate": 1.109410462219762e-05, + "loss": 0.1235, + "step": 37785 + }, + { + "epoch": 3.7, + "learning_rate": 1.1089952947688902e-05, + "loss": 0.1034, + "step": 37790 + }, + { + "epoch": 3.7, + "learning_rate": 1.1085801273180183e-05, + "loss": 0.0895, + "step": 37795 + }, + { + "epoch": 3.7, + "learning_rate": 1.1081649598671464e-05, + "loss": 0.1291, + "step": 37800 + }, + { + "epoch": 3.7, + "learning_rate": 1.1077497924162746e-05, + "loss": 0.0945, + "step": 37805 + }, + { + "epoch": 3.7, + "learning_rate": 1.1073346249654027e-05, + "loss": 0.0967, + "step": 37810 + }, + { + "epoch": 3.7, + "learning_rate": 1.106919457514531e-05, + "loss": 0.1274, + "step": 37815 + }, + { + "epoch": 3.7, + "learning_rate": 1.106504290063659e-05, + "loss": 0.1101, + "step": 37820 + }, + { + "epoch": 3.7, + "learning_rate": 1.1060891226127871e-05, + "loss": 0.0893, + "step": 37825 + }, + { + "epoch": 3.7, + "learning_rate": 1.1056739551619154e-05, + "loss": 0.0948, + "step": 37830 + }, + { + "epoch": 3.7, + "learning_rate": 1.1052587877110436e-05, + "loss": 0.1091, + "step": 37835 + }, + { + "epoch": 3.7, + "learning_rate": 1.1048436202601717e-05, + "loss": 0.0981, + "step": 37840 + }, + { + "epoch": 3.7, + "learning_rate": 1.1044284528092998e-05, + "loss": 0.0864, + "step": 37845 + }, + { + "epoch": 3.7, + "learning_rate": 1.1040132853584278e-05, + "loss": 0.112, + "step": 37850 + }, + { + "epoch": 3.7, + "learning_rate": 1.103598117907556e-05, + "loss": 0.103, + "step": 37855 + }, + { + "epoch": 3.7, + "learning_rate": 1.1031829504566843e-05, + "loss": 0.0973, + "step": 37860 + }, + { + "epoch": 3.7, + "learning_rate": 1.1027677830058124e-05, + "loss": 0.1238, + "step": 37865 + }, + { + "epoch": 3.7, + "learning_rate": 1.1023526155549405e-05, + "loss": 0.1076, + "step": 37870 + }, + { + "epoch": 3.7, + "learning_rate": 1.1019374481040686e-05, + "loss": 0.0903, + "step": 37875 + }, + { + "epoch": 3.7, + "learning_rate": 1.1015222806531968e-05, + "loss": 0.0896, + "step": 37880 + }, + { + "epoch": 3.7, + "learning_rate": 1.101107113202325e-05, + "loss": 0.0972, + "step": 37885 + }, + { + "epoch": 3.71, + "learning_rate": 1.1006919457514531e-05, + "loss": 0.0971, + "step": 37890 + }, + { + "epoch": 3.71, + "learning_rate": 1.1002767783005812e-05, + "loss": 0.0897, + "step": 37895 + }, + { + "epoch": 3.71, + "learning_rate": 1.0998616108497094e-05, + "loss": 0.1263, + "step": 37900 + }, + { + "epoch": 3.71, + "learning_rate": 1.0994464433988375e-05, + "loss": 0.0947, + "step": 37905 + }, + { + "epoch": 3.71, + "learning_rate": 1.0990312759479658e-05, + "loss": 0.0962, + "step": 37910 + }, + { + "epoch": 3.71, + "learning_rate": 1.0986161084970938e-05, + "loss": 0.1196, + "step": 37915 + }, + { + "epoch": 3.71, + "learning_rate": 1.098200941046222e-05, + "loss": 0.0993, + "step": 37920 + }, + { + "epoch": 3.71, + "learning_rate": 1.0977857735953502e-05, + "loss": 0.0916, + "step": 37925 + }, + { + "epoch": 3.71, + "learning_rate": 1.0973706061444782e-05, + "loss": 0.0903, + "step": 37930 + }, + { + "epoch": 3.71, + "learning_rate": 1.0969554386936065e-05, + "loss": 0.1046, + "step": 37935 + }, + { + "epoch": 3.71, + "learning_rate": 1.0965402712427346e-05, + "loss": 0.0886, + "step": 37940 + }, + { + "epoch": 3.71, + "learning_rate": 1.0961251037918628e-05, + "loss": 0.1014, + "step": 37945 + }, + { + "epoch": 3.71, + "learning_rate": 1.0957099363409909e-05, + "loss": 0.1263, + "step": 37950 + }, + { + "epoch": 3.71, + "learning_rate": 1.095294768890119e-05, + "loss": 0.0977, + "step": 37955 + }, + { + "epoch": 3.71, + "learning_rate": 1.0948796014392472e-05, + "loss": 0.0934, + "step": 37960 + }, + { + "epoch": 3.71, + "learning_rate": 1.0944644339883753e-05, + "loss": 0.0957, + "step": 37965 + }, + { + "epoch": 3.71, + "learning_rate": 1.0940492665375035e-05, + "loss": 0.1152, + "step": 37970 + }, + { + "epoch": 3.71, + "learning_rate": 1.0936340990866316e-05, + "loss": 0.1029, + "step": 37975 + }, + { + "epoch": 3.71, + "learning_rate": 1.0932189316357597e-05, + "loss": 0.1088, + "step": 37980 + }, + { + "epoch": 3.71, + "learning_rate": 1.092803764184888e-05, + "loss": 0.1033, + "step": 37985 + }, + { + "epoch": 3.71, + "learning_rate": 1.0923885967340162e-05, + "loss": 0.0876, + "step": 37990 + }, + { + "epoch": 3.72, + "learning_rate": 1.0919734292831443e-05, + "loss": 0.0985, + "step": 37995 + }, + { + "epoch": 3.72, + "learning_rate": 1.0915582618322723e-05, + "loss": 0.1193, + "step": 38000 + }, + { + "epoch": 3.72, + "eval_cer": 0.05629510418039591, + "eval_loss": 0.23056894540786743, + "eval_runtime": 272.602, + "eval_samples_per_second": 60.051, + "eval_steps_per_second": 1.669, + "eval_wer": 0.1437871793030044, + "step": 38000 + }, + { + "epoch": 3.72, + "learning_rate": 1.0911430943814004e-05, + "loss": 0.1036, + "step": 38005 + }, + { + "epoch": 3.72, + "learning_rate": 1.0907279269305288e-05, + "loss": 0.0951, + "step": 38010 + }, + { + "epoch": 3.72, + "learning_rate": 1.0903127594796569e-05, + "loss": 0.126, + "step": 38015 + }, + { + "epoch": 3.72, + "learning_rate": 1.089897592028785e-05, + "loss": 0.1091, + "step": 38020 + }, + { + "epoch": 3.72, + "learning_rate": 1.089482424577913e-05, + "loss": 0.0921, + "step": 38025 + }, + { + "epoch": 3.72, + "learning_rate": 1.0890672571270411e-05, + "loss": 0.0988, + "step": 38030 + }, + { + "epoch": 3.72, + "learning_rate": 1.0886520896761696e-05, + "loss": 0.1059, + "step": 38035 + }, + { + "epoch": 3.72, + "learning_rate": 1.0882369222252976e-05, + "loss": 0.0978, + "step": 38040 + }, + { + "epoch": 3.72, + "learning_rate": 1.0878217547744257e-05, + "loss": 0.0901, + "step": 38045 + }, + { + "epoch": 3.72, + "learning_rate": 1.0874065873235538e-05, + "loss": 0.1081, + "step": 38050 + }, + { + "epoch": 3.72, + "learning_rate": 1.086991419872682e-05, + "loss": 0.0965, + "step": 38055 + }, + { + "epoch": 3.72, + "learning_rate": 1.0865762524218103e-05, + "loss": 0.0967, + "step": 38060 + }, + { + "epoch": 3.72, + "learning_rate": 1.0861610849709384e-05, + "loss": 0.1168, + "step": 38065 + }, + { + "epoch": 3.72, + "learning_rate": 1.0857459175200664e-05, + "loss": 0.111, + "step": 38070 + }, + { + "epoch": 3.72, + "learning_rate": 1.0853307500691945e-05, + "loss": 0.103, + "step": 38075 + }, + { + "epoch": 3.72, + "learning_rate": 1.0849155826183228e-05, + "loss": 0.0988, + "step": 38080 + }, + { + "epoch": 3.72, + "learning_rate": 1.0845004151674508e-05, + "loss": 0.1293, + "step": 38085 + }, + { + "epoch": 3.72, + "learning_rate": 1.084085247716579e-05, + "loss": 0.0957, + "step": 38090 + }, + { + "epoch": 3.73, + "learning_rate": 1.0836700802657072e-05, + "loss": 0.0958, + "step": 38095 + }, + { + "epoch": 3.73, + "learning_rate": 1.0832549128148354e-05, + "loss": 0.1214, + "step": 38100 + }, + { + "epoch": 3.73, + "learning_rate": 1.0828397453639635e-05, + "loss": 0.1047, + "step": 38105 + }, + { + "epoch": 3.73, + "learning_rate": 1.0824245779130916e-05, + "loss": 0.1153, + "step": 38110 + }, + { + "epoch": 3.73, + "learning_rate": 1.0820094104622198e-05, + "loss": 0.1056, + "step": 38115 + }, + { + "epoch": 3.73, + "learning_rate": 1.081594243011348e-05, + "loss": 0.103, + "step": 38120 + }, + { + "epoch": 3.73, + "learning_rate": 1.0811790755604761e-05, + "loss": 0.0931, + "step": 38125 + }, + { + "epoch": 3.73, + "learning_rate": 1.0807639081096042e-05, + "loss": 0.1044, + "step": 38130 + }, + { + "epoch": 3.73, + "learning_rate": 1.0803487406587323e-05, + "loss": 0.1129, + "step": 38135 + }, + { + "epoch": 3.73, + "learning_rate": 1.0799335732078605e-05, + "loss": 0.0994, + "step": 38140 + }, + { + "epoch": 3.73, + "learning_rate": 1.0795184057569888e-05, + "loss": 0.0969, + "step": 38145 + }, + { + "epoch": 3.73, + "learning_rate": 1.0791032383061168e-05, + "loss": 0.0988, + "step": 38150 + }, + { + "epoch": 3.73, + "learning_rate": 1.078688070855245e-05, + "loss": 0.0959, + "step": 38155 + }, + { + "epoch": 3.73, + "learning_rate": 1.078272903404373e-05, + "loss": 0.082, + "step": 38160 + }, + { + "epoch": 3.73, + "learning_rate": 1.0778577359535014e-05, + "loss": 0.1166, + "step": 38165 + }, + { + "epoch": 3.73, + "learning_rate": 1.0774425685026295e-05, + "loss": 0.1085, + "step": 38170 + }, + { + "epoch": 3.73, + "learning_rate": 1.0770274010517576e-05, + "loss": 0.0877, + "step": 38175 + }, + { + "epoch": 3.73, + "learning_rate": 1.0766122336008856e-05, + "loss": 0.0893, + "step": 38180 + }, + { + "epoch": 3.73, + "learning_rate": 1.0761970661500137e-05, + "loss": 0.1274, + "step": 38185 + }, + { + "epoch": 3.73, + "learning_rate": 1.0757818986991421e-05, + "loss": 0.096, + "step": 38190 + }, + { + "epoch": 3.73, + "learning_rate": 1.0753667312482702e-05, + "loss": 0.0925, + "step": 38195 + }, + { + "epoch": 3.74, + "learning_rate": 1.0749515637973983e-05, + "loss": 0.1251, + "step": 38200 + }, + { + "epoch": 3.74, + "learning_rate": 1.0745363963465264e-05, + "loss": 0.0987, + "step": 38205 + }, + { + "epoch": 3.74, + "learning_rate": 1.0741212288956546e-05, + "loss": 0.0948, + "step": 38210 + }, + { + "epoch": 3.74, + "learning_rate": 1.0737060614447829e-05, + "loss": 0.1198, + "step": 38215 + }, + { + "epoch": 3.74, + "learning_rate": 1.073290893993911e-05, + "loss": 0.1022, + "step": 38220 + }, + { + "epoch": 3.74, + "learning_rate": 1.072875726543039e-05, + "loss": 0.0935, + "step": 38225 + }, + { + "epoch": 3.74, + "learning_rate": 1.0724605590921673e-05, + "loss": 0.0909, + "step": 38230 + }, + { + "epoch": 3.74, + "learning_rate": 1.0720453916412953e-05, + "loss": 0.1018, + "step": 38235 + }, + { + "epoch": 3.74, + "learning_rate": 1.0716302241904236e-05, + "loss": 0.104, + "step": 38240 + }, + { + "epoch": 3.74, + "learning_rate": 1.0712150567395517e-05, + "loss": 0.0948, + "step": 38245 + }, + { + "epoch": 3.74, + "learning_rate": 1.0707998892886797e-05, + "loss": 0.1113, + "step": 38250 + }, + { + "epoch": 3.74, + "learning_rate": 1.070384721837808e-05, + "loss": 0.095, + "step": 38255 + }, + { + "epoch": 3.74, + "learning_rate": 1.069969554386936e-05, + "loss": 0.1043, + "step": 38260 + }, + { + "epoch": 3.74, + "learning_rate": 1.0695543869360643e-05, + "loss": 0.1122, + "step": 38265 + }, + { + "epoch": 3.74, + "learning_rate": 1.0691392194851924e-05, + "loss": 0.1038, + "step": 38270 + }, + { + "epoch": 3.74, + "learning_rate": 1.0687240520343206e-05, + "loss": 0.0933, + "step": 38275 + }, + { + "epoch": 3.74, + "learning_rate": 1.0683088845834487e-05, + "loss": 0.1112, + "step": 38280 + }, + { + "epoch": 3.74, + "learning_rate": 1.0678937171325768e-05, + "loss": 0.1112, + "step": 38285 + }, + { + "epoch": 3.74, + "learning_rate": 1.0674785496817049e-05, + "loss": 0.0874, + "step": 38290 + }, + { + "epoch": 3.74, + "learning_rate": 1.0670633822308331e-05, + "loss": 0.0877, + "step": 38295 + }, + { + "epoch": 3.75, + "learning_rate": 1.0666482147799614e-05, + "loss": 0.1216, + "step": 38300 + }, + { + "epoch": 3.75, + "learning_rate": 1.0662330473290894e-05, + "loss": 0.0942, + "step": 38305 + }, + { + "epoch": 3.75, + "learning_rate": 1.0658178798782175e-05, + "loss": 0.1108, + "step": 38310 + }, + { + "epoch": 3.75, + "learning_rate": 1.0654027124273456e-05, + "loss": 0.1066, + "step": 38315 + }, + { + "epoch": 3.75, + "learning_rate": 1.064987544976474e-05, + "loss": 0.0959, + "step": 38320 + }, + { + "epoch": 3.75, + "learning_rate": 1.064572377525602e-05, + "loss": 0.0885, + "step": 38325 + }, + { + "epoch": 3.75, + "learning_rate": 1.0641572100747302e-05, + "loss": 0.1122, + "step": 38330 + }, + { + "epoch": 3.75, + "learning_rate": 1.0637420426238582e-05, + "loss": 0.1103, + "step": 38335 + }, + { + "epoch": 3.75, + "learning_rate": 1.0633268751729865e-05, + "loss": 0.0903, + "step": 38340 + }, + { + "epoch": 3.75, + "learning_rate": 1.0629117077221147e-05, + "loss": 0.1043, + "step": 38345 + }, + { + "epoch": 3.75, + "learning_rate": 1.0624965402712428e-05, + "loss": 0.1135, + "step": 38350 + }, + { + "epoch": 3.75, + "learning_rate": 1.0620813728203709e-05, + "loss": 0.0914, + "step": 38355 + }, + { + "epoch": 3.75, + "learning_rate": 1.061666205369499e-05, + "loss": 0.0905, + "step": 38360 + }, + { + "epoch": 3.75, + "learning_rate": 1.0612510379186272e-05, + "loss": 0.1119, + "step": 38365 + }, + { + "epoch": 3.75, + "learning_rate": 1.0608358704677554e-05, + "loss": 0.1036, + "step": 38370 + }, + { + "epoch": 3.75, + "learning_rate": 1.0604207030168835e-05, + "loss": 0.1023, + "step": 38375 + }, + { + "epoch": 3.75, + "learning_rate": 1.0600055355660116e-05, + "loss": 0.0995, + "step": 38380 + }, + { + "epoch": 3.75, + "learning_rate": 1.0595903681151398e-05, + "loss": 0.1262, + "step": 38385 + }, + { + "epoch": 3.75, + "learning_rate": 1.059175200664268e-05, + "loss": 0.0951, + "step": 38390 + }, + { + "epoch": 3.75, + "learning_rate": 1.0587600332133962e-05, + "loss": 0.0958, + "step": 38395 + }, + { + "epoch": 3.75, + "learning_rate": 1.0583448657625242e-05, + "loss": 0.1315, + "step": 38400 + }, + { + "epoch": 3.76, + "learning_rate": 1.0579296983116523e-05, + "loss": 0.1006, + "step": 38405 + }, + { + "epoch": 3.76, + "learning_rate": 1.0575145308607806e-05, + "loss": 0.0921, + "step": 38410 + }, + { + "epoch": 3.76, + "learning_rate": 1.0570993634099086e-05, + "loss": 0.1225, + "step": 38415 + }, + { + "epoch": 3.76, + "learning_rate": 1.0566841959590369e-05, + "loss": 0.1062, + "step": 38420 + }, + { + "epoch": 3.76, + "learning_rate": 1.056269028508165e-05, + "loss": 0.0953, + "step": 38425 + }, + { + "epoch": 3.76, + "learning_rate": 1.0558538610572932e-05, + "loss": 0.1054, + "step": 38430 + }, + { + "epoch": 3.76, + "learning_rate": 1.0554386936064213e-05, + "loss": 0.1091, + "step": 38435 + }, + { + "epoch": 3.76, + "learning_rate": 1.0550235261555494e-05, + "loss": 0.0822, + "step": 38440 + }, + { + "epoch": 3.76, + "learning_rate": 1.0546083587046776e-05, + "loss": 0.1164, + "step": 38445 + }, + { + "epoch": 3.76, + "learning_rate": 1.0541931912538059e-05, + "loss": 0.116, + "step": 38450 + }, + { + "epoch": 3.76, + "learning_rate": 1.053778023802934e-05, + "loss": 0.1036, + "step": 38455 + }, + { + "epoch": 3.76, + "learning_rate": 1.053362856352062e-05, + "loss": 0.0814, + "step": 38460 + }, + { + "epoch": 3.76, + "learning_rate": 1.0529476889011901e-05, + "loss": 0.121, + "step": 38465 + }, + { + "epoch": 3.76, + "learning_rate": 1.0525325214503183e-05, + "loss": 0.104, + "step": 38470 + }, + { + "epoch": 3.76, + "learning_rate": 1.0521173539994466e-05, + "loss": 0.0904, + "step": 38475 + }, + { + "epoch": 3.76, + "learning_rate": 1.0517021865485747e-05, + "loss": 0.1221, + "step": 38480 + }, + { + "epoch": 3.76, + "learning_rate": 1.0512870190977027e-05, + "loss": 0.1253, + "step": 38485 + }, + { + "epoch": 3.76, + "learning_rate": 1.0508718516468308e-05, + "loss": 0.0891, + "step": 38490 + }, + { + "epoch": 3.76, + "learning_rate": 1.050456684195959e-05, + "loss": 0.1038, + "step": 38495 + }, + { + "epoch": 3.76, + "learning_rate": 1.0500415167450873e-05, + "loss": 0.1148, + "step": 38500 + }, + { + "epoch": 3.76, + "eval_cer": 0.055836113866594525, + "eval_loss": 0.22591058909893036, + "eval_runtime": 274.9325, + "eval_samples_per_second": 59.542, + "eval_steps_per_second": 1.655, + "eval_wer": 0.1439112463514493, + "step": 38500 + }, + { + "epoch": 3.77, + "learning_rate": 1.0496263492942154e-05, + "loss": 0.1152, + "step": 38505 + }, + { + "epoch": 3.77, + "learning_rate": 1.0492111818433435e-05, + "loss": 0.0867, + "step": 38510 + }, + { + "epoch": 3.77, + "learning_rate": 1.0487960143924715e-05, + "loss": 0.1137, + "step": 38515 + }, + { + "epoch": 3.77, + "learning_rate": 1.0483808469415998e-05, + "loss": 0.1066, + "step": 38520 + }, + { + "epoch": 3.77, + "learning_rate": 1.047965679490728e-05, + "loss": 0.09, + "step": 38525 + }, + { + "epoch": 3.77, + "learning_rate": 1.0475505120398561e-05, + "loss": 0.1058, + "step": 38530 + }, + { + "epoch": 3.77, + "learning_rate": 1.0471353445889842e-05, + "loss": 0.1106, + "step": 38535 + }, + { + "epoch": 3.77, + "learning_rate": 1.0467201771381124e-05, + "loss": 0.1056, + "step": 38540 + }, + { + "epoch": 3.77, + "learning_rate": 1.0463050096872405e-05, + "loss": 0.0965, + "step": 38545 + }, + { + "epoch": 3.77, + "learning_rate": 1.0458898422363687e-05, + "loss": 0.1214, + "step": 38550 + }, + { + "epoch": 3.77, + "learning_rate": 1.0454746747854968e-05, + "loss": 0.105, + "step": 38555 + }, + { + "epoch": 3.77, + "learning_rate": 1.045059507334625e-05, + "loss": 0.0915, + "step": 38560 + }, + { + "epoch": 3.77, + "learning_rate": 1.0446443398837531e-05, + "loss": 0.1323, + "step": 38565 + }, + { + "epoch": 3.77, + "learning_rate": 1.0442291724328812e-05, + "loss": 0.088, + "step": 38570 + }, + { + "epoch": 3.77, + "learning_rate": 1.0438140049820095e-05, + "loss": 0.0945, + "step": 38575 + }, + { + "epoch": 3.77, + "learning_rate": 1.0433988375311375e-05, + "loss": 0.0912, + "step": 38580 + }, + { + "epoch": 3.77, + "learning_rate": 1.0429836700802658e-05, + "loss": 0.1223, + "step": 38585 + }, + { + "epoch": 3.77, + "learning_rate": 1.0425685026293939e-05, + "loss": 0.0959, + "step": 38590 + }, + { + "epoch": 3.77, + "learning_rate": 1.042153335178522e-05, + "loss": 0.0963, + "step": 38595 + }, + { + "epoch": 3.77, + "learning_rate": 1.0417381677276502e-05, + "loss": 0.1106, + "step": 38600 + }, + { + "epoch": 3.77, + "learning_rate": 1.0413230002767784e-05, + "loss": 0.1069, + "step": 38605 + }, + { + "epoch": 3.78, + "learning_rate": 1.0409078328259065e-05, + "loss": 0.0924, + "step": 38610 + }, + { + "epoch": 3.78, + "learning_rate": 1.0404926653750346e-05, + "loss": 0.1196, + "step": 38615 + }, + { + "epoch": 3.78, + "learning_rate": 1.0400774979241627e-05, + "loss": 0.1049, + "step": 38620 + }, + { + "epoch": 3.78, + "learning_rate": 1.039662330473291e-05, + "loss": 0.1037, + "step": 38625 + }, + { + "epoch": 3.78, + "learning_rate": 1.0392471630224192e-05, + "loss": 0.1011, + "step": 38630 + }, + { + "epoch": 3.78, + "learning_rate": 1.0388319955715472e-05, + "loss": 0.1127, + "step": 38635 + }, + { + "epoch": 3.78, + "learning_rate": 1.0384168281206753e-05, + "loss": 0.0914, + "step": 38640 + }, + { + "epoch": 3.78, + "learning_rate": 1.0380016606698034e-05, + "loss": 0.1054, + "step": 38645 + }, + { + "epoch": 3.78, + "learning_rate": 1.0375864932189318e-05, + "loss": 0.141, + "step": 38650 + }, + { + "epoch": 3.78, + "learning_rate": 1.0371713257680599e-05, + "loss": 0.0973, + "step": 38655 + }, + { + "epoch": 3.78, + "learning_rate": 1.036756158317188e-05, + "loss": 0.0916, + "step": 38660 + }, + { + "epoch": 3.78, + "learning_rate": 1.036340990866316e-05, + "loss": 0.115, + "step": 38665 + }, + { + "epoch": 3.78, + "learning_rate": 1.0359258234154441e-05, + "loss": 0.0967, + "step": 38670 + }, + { + "epoch": 3.78, + "learning_rate": 1.0355106559645725e-05, + "loss": 0.0957, + "step": 38675 + }, + { + "epoch": 3.78, + "learning_rate": 1.0350954885137006e-05, + "loss": 0.0956, + "step": 38680 + }, + { + "epoch": 3.78, + "learning_rate": 1.0346803210628287e-05, + "loss": 0.1149, + "step": 38685 + }, + { + "epoch": 3.78, + "learning_rate": 1.0342651536119568e-05, + "loss": 0.1004, + "step": 38690 + }, + { + "epoch": 3.78, + "learning_rate": 1.033849986161085e-05, + "loss": 0.0849, + "step": 38695 + }, + { + "epoch": 3.78, + "learning_rate": 1.0334348187102131e-05, + "loss": 0.1196, + "step": 38700 + }, + { + "epoch": 3.78, + "learning_rate": 1.0330196512593413e-05, + "loss": 0.0886, + "step": 38705 + }, + { + "epoch": 3.79, + "learning_rate": 1.0326044838084694e-05, + "loss": 0.0974, + "step": 38710 + }, + { + "epoch": 3.79, + "learning_rate": 1.0321893163575977e-05, + "loss": 0.115, + "step": 38715 + }, + { + "epoch": 3.79, + "learning_rate": 1.0317741489067257e-05, + "loss": 0.1109, + "step": 38720 + }, + { + "epoch": 3.79, + "learning_rate": 1.0313589814558538e-05, + "loss": 0.0982, + "step": 38725 + }, + { + "epoch": 3.79, + "learning_rate": 1.030943814004982e-05, + "loss": 0.0998, + "step": 38730 + }, + { + "epoch": 3.79, + "learning_rate": 1.0305286465541101e-05, + "loss": 0.1206, + "step": 38735 + }, + { + "epoch": 3.79, + "learning_rate": 1.0301134791032384e-05, + "loss": 0.0896, + "step": 38740 + }, + { + "epoch": 3.79, + "learning_rate": 1.0296983116523665e-05, + "loss": 0.0869, + "step": 38745 + }, + { + "epoch": 3.79, + "learning_rate": 1.0292831442014945e-05, + "loss": 0.1138, + "step": 38750 + }, + { + "epoch": 3.79, + "learning_rate": 1.0288679767506228e-05, + "loss": 0.0955, + "step": 38755 + }, + { + "epoch": 3.79, + "learning_rate": 1.028452809299751e-05, + "loss": 0.0993, + "step": 38760 + }, + { + "epoch": 3.79, + "learning_rate": 1.0280376418488791e-05, + "loss": 0.1111, + "step": 38765 + }, + { + "epoch": 3.79, + "learning_rate": 1.0276224743980072e-05, + "loss": 0.0918, + "step": 38770 + }, + { + "epoch": 3.79, + "learning_rate": 1.0272073069471353e-05, + "loss": 0.0877, + "step": 38775 + }, + { + "epoch": 3.79, + "learning_rate": 1.0267921394962635e-05, + "loss": 0.1118, + "step": 38780 + }, + { + "epoch": 3.79, + "learning_rate": 1.0263769720453917e-05, + "loss": 0.1223, + "step": 38785 + }, + { + "epoch": 3.79, + "learning_rate": 1.0259618045945198e-05, + "loss": 0.0997, + "step": 38790 + }, + { + "epoch": 3.79, + "learning_rate": 1.0255466371436479e-05, + "loss": 0.1071, + "step": 38795 + }, + { + "epoch": 3.79, + "learning_rate": 1.025131469692776e-05, + "loss": 0.1149, + "step": 38800 + }, + { + "epoch": 3.79, + "learning_rate": 1.0247163022419044e-05, + "loss": 0.0928, + "step": 38805 + }, + { + "epoch": 3.79, + "learning_rate": 1.0243011347910325e-05, + "loss": 0.1034, + "step": 38810 + }, + { + "epoch": 3.8, + "learning_rate": 1.0238859673401605e-05, + "loss": 0.1162, + "step": 38815 + }, + { + "epoch": 3.8, + "learning_rate": 1.0234707998892886e-05, + "loss": 0.1068, + "step": 38820 + }, + { + "epoch": 3.8, + "learning_rate": 1.0230556324384169e-05, + "loss": 0.0996, + "step": 38825 + }, + { + "epoch": 3.8, + "learning_rate": 1.0226404649875451e-05, + "loss": 0.0953, + "step": 38830 + }, + { + "epoch": 3.8, + "learning_rate": 1.0222252975366732e-05, + "loss": 0.1213, + "step": 38835 + }, + { + "epoch": 3.8, + "learning_rate": 1.0218101300858013e-05, + "loss": 0.1056, + "step": 38840 + }, + { + "epoch": 3.8, + "learning_rate": 1.0213949626349293e-05, + "loss": 0.0859, + "step": 38845 + }, + { + "epoch": 3.8, + "learning_rate": 1.0209797951840576e-05, + "loss": 0.1059, + "step": 38850 + }, + { + "epoch": 3.8, + "learning_rate": 1.0205646277331858e-05, + "loss": 0.1081, + "step": 38855 + }, + { + "epoch": 3.8, + "learning_rate": 1.020149460282314e-05, + "loss": 0.1093, + "step": 38860 + }, + { + "epoch": 3.8, + "learning_rate": 1.019734292831442e-05, + "loss": 0.1206, + "step": 38865 + }, + { + "epoch": 3.8, + "learning_rate": 1.0193191253805702e-05, + "loss": 0.0955, + "step": 38870 + }, + { + "epoch": 3.8, + "learning_rate": 1.0189039579296983e-05, + "loss": 0.0903, + "step": 38875 + }, + { + "epoch": 3.8, + "learning_rate": 1.0184887904788266e-05, + "loss": 0.0936, + "step": 38880 + }, + { + "epoch": 3.8, + "learning_rate": 1.0180736230279546e-05, + "loss": 0.1171, + "step": 38885 + }, + { + "epoch": 3.8, + "learning_rate": 1.0176584555770827e-05, + "loss": 0.0905, + "step": 38890 + }, + { + "epoch": 3.8, + "learning_rate": 1.017243288126211e-05, + "loss": 0.0895, + "step": 38895 + }, + { + "epoch": 3.8, + "learning_rate": 1.016828120675339e-05, + "loss": 0.1083, + "step": 38900 + }, + { + "epoch": 3.8, + "learning_rate": 1.0164129532244671e-05, + "loss": 0.0933, + "step": 38905 + }, + { + "epoch": 3.8, + "learning_rate": 1.0159977857735954e-05, + "loss": 0.0933, + "step": 38910 + }, + { + "epoch": 3.81, + "learning_rate": 1.0155826183227236e-05, + "loss": 0.1102, + "step": 38915 + }, + { + "epoch": 3.81, + "learning_rate": 1.0151674508718517e-05, + "loss": 0.0933, + "step": 38920 + }, + { + "epoch": 3.81, + "learning_rate": 1.0147522834209798e-05, + "loss": 0.0831, + "step": 38925 + }, + { + "epoch": 3.81, + "learning_rate": 1.0143371159701078e-05, + "loss": 0.0914, + "step": 38930 + }, + { + "epoch": 3.81, + "learning_rate": 1.0139219485192363e-05, + "loss": 0.1047, + "step": 38935 + }, + { + "epoch": 3.81, + "learning_rate": 1.0135067810683643e-05, + "loss": 0.092, + "step": 38940 + }, + { + "epoch": 3.81, + "learning_rate": 1.0130916136174924e-05, + "loss": 0.088, + "step": 38945 + }, + { + "epoch": 3.81, + "learning_rate": 1.0126764461666205e-05, + "loss": 0.1135, + "step": 38950 + }, + { + "epoch": 3.81, + "learning_rate": 1.0122612787157486e-05, + "loss": 0.089, + "step": 38955 + }, + { + "epoch": 3.81, + "learning_rate": 1.011846111264877e-05, + "loss": 0.1051, + "step": 38960 + }, + { + "epoch": 3.81, + "learning_rate": 1.011430943814005e-05, + "loss": 0.1131, + "step": 38965 + }, + { + "epoch": 3.81, + "learning_rate": 1.0110157763631331e-05, + "loss": 0.0964, + "step": 38970 + }, + { + "epoch": 3.81, + "learning_rate": 1.0106006089122612e-05, + "loss": 0.1032, + "step": 38975 + }, + { + "epoch": 3.81, + "learning_rate": 1.0101854414613895e-05, + "loss": 0.0983, + "step": 38980 + }, + { + "epoch": 3.81, + "learning_rate": 1.0097702740105177e-05, + "loss": 0.1188, + "step": 38985 + }, + { + "epoch": 3.81, + "learning_rate": 1.0093551065596458e-05, + "loss": 0.1007, + "step": 38990 + }, + { + "epoch": 3.81, + "learning_rate": 1.0089399391087739e-05, + "loss": 0.0971, + "step": 38995 + }, + { + "epoch": 3.81, + "learning_rate": 1.008524771657902e-05, + "loss": 0.1066, + "step": 39000 + }, + { + "epoch": 3.81, + "eval_cer": 0.05576212046588095, + "eval_loss": 0.22931820154190063, + "eval_runtime": 272.1941, + "eval_samples_per_second": 60.141, + "eval_steps_per_second": 1.672, + "eval_wer": 0.14214165844994547, + "step": 39000 + }, + { + "epoch": 3.81, + "learning_rate": 1.0081096042070302e-05, + "loss": 0.1025, + "step": 39005 + }, + { + "epoch": 3.81, + "learning_rate": 1.0076944367561584e-05, + "loss": 0.0979, + "step": 39010 + }, + { + "epoch": 3.82, + "learning_rate": 1.0072792693052865e-05, + "loss": 0.1181, + "step": 39015 + }, + { + "epoch": 3.82, + "learning_rate": 1.0068641018544146e-05, + "loss": 0.1076, + "step": 39020 + }, + { + "epoch": 3.82, + "learning_rate": 1.0064489344035428e-05, + "loss": 0.099, + "step": 39025 + }, + { + "epoch": 3.82, + "learning_rate": 1.0060337669526709e-05, + "loss": 0.0978, + "step": 39030 + }, + { + "epoch": 3.82, + "learning_rate": 1.0056185995017991e-05, + "loss": 0.1182, + "step": 39035 + }, + { + "epoch": 3.82, + "learning_rate": 1.0052034320509272e-05, + "loss": 0.0971, + "step": 39040 + }, + { + "epoch": 3.82, + "learning_rate": 1.0047882646000555e-05, + "loss": 0.1001, + "step": 39045 + }, + { + "epoch": 3.82, + "learning_rate": 1.0043730971491835e-05, + "loss": 0.1369, + "step": 39050 + }, + { + "epoch": 3.82, + "learning_rate": 1.0039579296983116e-05, + "loss": 0.0822, + "step": 39055 + }, + { + "epoch": 3.82, + "learning_rate": 1.0035427622474399e-05, + "loss": 0.0942, + "step": 39060 + }, + { + "epoch": 3.82, + "learning_rate": 1.003127594796568e-05, + "loss": 0.0961, + "step": 39065 + }, + { + "epoch": 3.82, + "learning_rate": 1.0027124273456962e-05, + "loss": 0.0985, + "step": 39070 + }, + { + "epoch": 3.82, + "learning_rate": 1.0022972598948243e-05, + "loss": 0.0922, + "step": 39075 + }, + { + "epoch": 3.82, + "learning_rate": 1.0018820924439523e-05, + "loss": 0.0966, + "step": 39080 + }, + { + "epoch": 3.82, + "learning_rate": 1.0014669249930806e-05, + "loss": 0.1118, + "step": 39085 + }, + { + "epoch": 3.82, + "learning_rate": 1.0010517575422088e-05, + "loss": 0.097, + "step": 39090 + }, + { + "epoch": 3.82, + "learning_rate": 1.0007196235815113e-05, + "loss": 0.0921, + "step": 39095 + }, + { + "epoch": 3.82, + "learning_rate": 1.0003044561306394e-05, + "loss": 0.1081, + "step": 39100 + }, + { + "epoch": 3.82, + "learning_rate": 9.998892886797675e-06, + "loss": 0.1089, + "step": 39105 + }, + { + "epoch": 3.82, + "learning_rate": 9.994741212288957e-06, + "loss": 0.0883, + "step": 39110 + }, + { + "epoch": 3.82, + "learning_rate": 9.990589537780238e-06, + "loss": 0.1136, + "step": 39115 + }, + { + "epoch": 3.83, + "learning_rate": 9.98643786327152e-06, + "loss": 0.1223, + "step": 39120 + }, + { + "epoch": 3.83, + "learning_rate": 9.982286188762801e-06, + "loss": 0.096, + "step": 39125 + }, + { + "epoch": 3.83, + "learning_rate": 9.978134514254082e-06, + "loss": 0.095, + "step": 39130 + }, + { + "epoch": 3.83, + "learning_rate": 9.973982839745364e-06, + "loss": 0.1097, + "step": 39135 + }, + { + "epoch": 3.83, + "learning_rate": 9.969831165236647e-06, + "loss": 0.1083, + "step": 39140 + }, + { + "epoch": 3.83, + "learning_rate": 9.965679490727927e-06, + "loss": 0.0964, + "step": 39145 + }, + { + "epoch": 3.83, + "learning_rate": 9.961527816219208e-06, + "loss": 0.1179, + "step": 39150 + }, + { + "epoch": 3.83, + "learning_rate": 9.957376141710489e-06, + "loss": 0.1016, + "step": 39155 + }, + { + "epoch": 3.83, + "learning_rate": 9.953224467201771e-06, + "loss": 0.0983, + "step": 39160 + }, + { + "epoch": 3.83, + "learning_rate": 9.949072792693054e-06, + "loss": 0.1162, + "step": 39165 + }, + { + "epoch": 3.83, + "learning_rate": 9.944921118184335e-06, + "loss": 0.1012, + "step": 39170 + }, + { + "epoch": 3.83, + "learning_rate": 9.940769443675615e-06, + "loss": 0.0965, + "step": 39175 + }, + { + "epoch": 3.83, + "learning_rate": 9.936617769166896e-06, + "loss": 0.0995, + "step": 39180 + }, + { + "epoch": 3.83, + "learning_rate": 9.93246609465818e-06, + "loss": 0.1149, + "step": 39185 + }, + { + "epoch": 3.83, + "learning_rate": 9.928314420149461e-06, + "loss": 0.0959, + "step": 39190 + }, + { + "epoch": 3.83, + "learning_rate": 9.924162745640742e-06, + "loss": 0.0821, + "step": 39195 + }, + { + "epoch": 3.83, + "learning_rate": 9.920011071132023e-06, + "loss": 0.1267, + "step": 39200 + }, + { + "epoch": 3.83, + "learning_rate": 9.915859396623305e-06, + "loss": 0.0936, + "step": 39205 + }, + { + "epoch": 3.83, + "learning_rate": 9.911707722114588e-06, + "loss": 0.0838, + "step": 39210 + }, + { + "epoch": 3.83, + "learning_rate": 9.907556047605868e-06, + "loss": 0.1219, + "step": 39215 + }, + { + "epoch": 3.84, + "learning_rate": 9.90340437309715e-06, + "loss": 0.1013, + "step": 39220 + }, + { + "epoch": 3.84, + "learning_rate": 9.89925269858843e-06, + "loss": 0.0983, + "step": 39225 + }, + { + "epoch": 3.84, + "learning_rate": 9.895101024079712e-06, + "loss": 0.1032, + "step": 39230 + }, + { + "epoch": 3.84, + "learning_rate": 9.890949349570995e-06, + "loss": 0.1165, + "step": 39235 + }, + { + "epoch": 3.84, + "learning_rate": 9.886797675062276e-06, + "loss": 0.0877, + "step": 39240 + }, + { + "epoch": 3.84, + "learning_rate": 9.882646000553556e-06, + "loss": 0.099, + "step": 39245 + }, + { + "epoch": 3.84, + "learning_rate": 9.878494326044839e-06, + "loss": 0.1125, + "step": 39250 + }, + { + "epoch": 3.84, + "learning_rate": 9.87434265153612e-06, + "loss": 0.0931, + "step": 39255 + }, + { + "epoch": 3.84, + "learning_rate": 9.870190977027402e-06, + "loss": 0.0921, + "step": 39260 + }, + { + "epoch": 3.84, + "learning_rate": 9.866039302518683e-06, + "loss": 0.1144, + "step": 39265 + }, + { + "epoch": 3.84, + "learning_rate": 9.861887628009964e-06, + "loss": 0.1083, + "step": 39270 + }, + { + "epoch": 3.84, + "learning_rate": 9.857735953501246e-06, + "loss": 0.0913, + "step": 39275 + }, + { + "epoch": 3.84, + "learning_rate": 9.853584278992527e-06, + "loss": 0.0945, + "step": 39280 + }, + { + "epoch": 3.84, + "learning_rate": 9.849432604483808e-06, + "loss": 0.1185, + "step": 39285 + }, + { + "epoch": 3.84, + "learning_rate": 9.84528092997509e-06, + "loss": 0.1061, + "step": 39290 + }, + { + "epoch": 3.84, + "learning_rate": 9.841129255466373e-06, + "loss": 0.0932, + "step": 39295 + }, + { + "epoch": 3.84, + "learning_rate": 9.836977580957653e-06, + "loss": 0.1038, + "step": 39300 + }, + { + "epoch": 3.84, + "learning_rate": 9.832825906448934e-06, + "loss": 0.1017, + "step": 39305 + }, + { + "epoch": 3.84, + "learning_rate": 9.828674231940215e-06, + "loss": 0.0966, + "step": 39310 + }, + { + "epoch": 3.84, + "learning_rate": 9.824522557431499e-06, + "loss": 0.114, + "step": 39315 + }, + { + "epoch": 3.84, + "learning_rate": 9.82037088292278e-06, + "loss": 0.1005, + "step": 39320 + }, + { + "epoch": 3.85, + "learning_rate": 9.81621920841406e-06, + "loss": 0.0934, + "step": 39325 + }, + { + "epoch": 3.85, + "learning_rate": 9.812067533905341e-06, + "loss": 0.0907, + "step": 39330 + }, + { + "epoch": 3.85, + "learning_rate": 9.807915859396622e-06, + "loss": 0.1102, + "step": 39335 + }, + { + "epoch": 3.85, + "learning_rate": 9.803764184887906e-06, + "loss": 0.0997, + "step": 39340 + }, + { + "epoch": 3.85, + "learning_rate": 9.799612510379187e-06, + "loss": 0.1, + "step": 39345 + }, + { + "epoch": 3.85, + "learning_rate": 9.795460835870468e-06, + "loss": 0.1108, + "step": 39350 + }, + { + "epoch": 3.85, + "learning_rate": 9.791309161361749e-06, + "loss": 0.0996, + "step": 39355 + }, + { + "epoch": 3.85, + "learning_rate": 9.787157486853031e-06, + "loss": 0.0856, + "step": 39360 + }, + { + "epoch": 3.85, + "learning_rate": 9.783005812344313e-06, + "loss": 0.1057, + "step": 39365 + }, + { + "epoch": 3.85, + "learning_rate": 9.778854137835594e-06, + "loss": 0.099, + "step": 39370 + }, + { + "epoch": 3.85, + "learning_rate": 9.774702463326875e-06, + "loss": 0.0899, + "step": 39375 + }, + { + "epoch": 3.85, + "learning_rate": 9.770550788818156e-06, + "loss": 0.0996, + "step": 39380 + }, + { + "epoch": 3.85, + "learning_rate": 9.766399114309438e-06, + "loss": 0.1091, + "step": 39385 + }, + { + "epoch": 3.85, + "learning_rate": 9.76224743980072e-06, + "loss": 0.1037, + "step": 39390 + }, + { + "epoch": 3.85, + "learning_rate": 9.758095765292001e-06, + "loss": 0.0928, + "step": 39395 + }, + { + "epoch": 3.85, + "learning_rate": 9.753944090783282e-06, + "loss": 0.0989, + "step": 39400 + }, + { + "epoch": 3.85, + "learning_rate": 9.749792416274565e-06, + "loss": 0.0986, + "step": 39405 + }, + { + "epoch": 3.85, + "learning_rate": 9.745640741765845e-06, + "loss": 0.1003, + "step": 39410 + }, + { + "epoch": 3.85, + "learning_rate": 9.741489067257128e-06, + "loss": 0.1096, + "step": 39415 + }, + { + "epoch": 3.85, + "learning_rate": 9.737337392748409e-06, + "loss": 0.1074, + "step": 39420 + }, + { + "epoch": 3.86, + "learning_rate": 9.733185718239691e-06, + "loss": 0.0955, + "step": 39425 + }, + { + "epoch": 3.86, + "learning_rate": 9.729034043730972e-06, + "loss": 0.1013, + "step": 39430 + }, + { + "epoch": 3.86, + "learning_rate": 9.724882369222253e-06, + "loss": 0.1269, + "step": 39435 + }, + { + "epoch": 3.86, + "learning_rate": 9.720730694713535e-06, + "loss": 0.0941, + "step": 39440 + }, + { + "epoch": 3.86, + "learning_rate": 9.716579020204816e-06, + "loss": 0.1031, + "step": 39445 + }, + { + "epoch": 3.86, + "learning_rate": 9.712427345696098e-06, + "loss": 0.1108, + "step": 39450 + }, + { + "epoch": 3.86, + "learning_rate": 9.70827567118738e-06, + "loss": 0.0987, + "step": 39455 + }, + { + "epoch": 3.86, + "learning_rate": 9.70412399667866e-06, + "loss": 0.0886, + "step": 39460 + }, + { + "epoch": 3.86, + "learning_rate": 9.699972322169942e-06, + "loss": 0.1113, + "step": 39465 + }, + { + "epoch": 3.86, + "learning_rate": 9.695820647661225e-06, + "loss": 0.1167, + "step": 39470 + }, + { + "epoch": 3.86, + "learning_rate": 9.691668973152506e-06, + "loss": 0.093, + "step": 39475 + }, + { + "epoch": 3.86, + "learning_rate": 9.687517298643786e-06, + "loss": 0.098, + "step": 39480 + }, + { + "epoch": 3.86, + "learning_rate": 9.683365624135067e-06, + "loss": 0.116, + "step": 39485 + }, + { + "epoch": 3.86, + "learning_rate": 9.679213949626348e-06, + "loss": 0.1049, + "step": 39490 + }, + { + "epoch": 3.86, + "learning_rate": 9.675062275117632e-06, + "loss": 0.0965, + "step": 39495 + }, + { + "epoch": 3.86, + "learning_rate": 9.670910600608913e-06, + "loss": 0.0899, + "step": 39500 + }, + { + "epoch": 3.86, + "eval_cer": 0.05518404702280615, + "eval_loss": 0.2266465127468109, + "eval_runtime": 275.5983, + "eval_samples_per_second": 59.398, + "eval_steps_per_second": 1.651, + "eval_wer": 0.14084221936360133, + "step": 39500 + }, + { + "epoch": 3.86, + "learning_rate": 9.666758926100194e-06, + "loss": 0.0938, + "step": 39505 + }, + { + "epoch": 3.86, + "learning_rate": 9.662607251591474e-06, + "loss": 0.092, + "step": 39510 + }, + { + "epoch": 3.86, + "learning_rate": 9.658455577082757e-06, + "loss": 0.1159, + "step": 39515 + }, + { + "epoch": 3.86, + "learning_rate": 9.65430390257404e-06, + "loss": 0.1034, + "step": 39520 + }, + { + "epoch": 3.86, + "learning_rate": 9.65015222806532e-06, + "loss": 0.0967, + "step": 39525 + }, + { + "epoch": 3.87, + "learning_rate": 9.646000553556601e-06, + "loss": 0.1059, + "step": 39530 + }, + { + "epoch": 3.87, + "learning_rate": 9.641848879047883e-06, + "loss": 0.1194, + "step": 39535 + }, + { + "epoch": 3.87, + "learning_rate": 9.637697204539164e-06, + "loss": 0.0946, + "step": 39540 + }, + { + "epoch": 3.87, + "learning_rate": 9.633545530030447e-06, + "loss": 0.0918, + "step": 39545 + }, + { + "epoch": 3.87, + "learning_rate": 9.629393855521727e-06, + "loss": 0.1177, + "step": 39550 + }, + { + "epoch": 3.87, + "learning_rate": 9.625242181013008e-06, + "loss": 0.1067, + "step": 39555 + }, + { + "epoch": 3.87, + "learning_rate": 9.62109050650429e-06, + "loss": 0.0964, + "step": 39560 + }, + { + "epoch": 3.87, + "learning_rate": 9.616938831995571e-06, + "loss": 0.1197, + "step": 39565 + }, + { + "epoch": 3.87, + "learning_rate": 9.612787157486854e-06, + "loss": 0.0953, + "step": 39570 + }, + { + "epoch": 3.87, + "learning_rate": 9.608635482978135e-06, + "loss": 0.0838, + "step": 39575 + }, + { + "epoch": 3.87, + "learning_rate": 9.604483808469417e-06, + "loss": 0.1203, + "step": 39580 + }, + { + "epoch": 3.87, + "learning_rate": 9.600332133960698e-06, + "loss": 0.1133, + "step": 39585 + }, + { + "epoch": 3.87, + "learning_rate": 9.596180459451979e-06, + "loss": 0.0798, + "step": 39590 + }, + { + "epoch": 3.87, + "learning_rate": 9.592028784943261e-06, + "loss": 0.0938, + "step": 39595 + }, + { + "epoch": 3.87, + "learning_rate": 9.587877110434542e-06, + "loss": 0.1038, + "step": 39600 + }, + { + "epoch": 3.87, + "learning_rate": 9.583725435925824e-06, + "loss": 0.0818, + "step": 39605 + }, + { + "epoch": 3.87, + "learning_rate": 9.579573761417105e-06, + "loss": 0.0827, + "step": 39610 + }, + { + "epoch": 3.87, + "learning_rate": 9.575422086908386e-06, + "loss": 0.1196, + "step": 39615 + }, + { + "epoch": 3.87, + "learning_rate": 9.571270412399668e-06, + "loss": 0.0961, + "step": 39620 + }, + { + "epoch": 3.87, + "learning_rate": 9.56711873789095e-06, + "loss": 0.0975, + "step": 39625 + }, + { + "epoch": 3.88, + "learning_rate": 9.562967063382231e-06, + "loss": 0.0982, + "step": 39630 + }, + { + "epoch": 3.88, + "learning_rate": 9.558815388873512e-06, + "loss": 0.1122, + "step": 39635 + }, + { + "epoch": 3.88, + "learning_rate": 9.554663714364793e-06, + "loss": 0.1016, + "step": 39640 + }, + { + "epoch": 3.88, + "learning_rate": 9.550512039856077e-06, + "loss": 0.1015, + "step": 39645 + }, + { + "epoch": 3.88, + "learning_rate": 9.546360365347358e-06, + "loss": 0.1148, + "step": 39650 + }, + { + "epoch": 3.88, + "learning_rate": 9.542208690838639e-06, + "loss": 0.0911, + "step": 39655 + }, + { + "epoch": 3.88, + "learning_rate": 9.53805701632992e-06, + "loss": 0.0862, + "step": 39660 + }, + { + "epoch": 3.88, + "learning_rate": 9.5339053418212e-06, + "loss": 0.1161, + "step": 39665 + }, + { + "epoch": 3.88, + "learning_rate": 9.529753667312483e-06, + "loss": 0.0983, + "step": 39670 + }, + { + "epoch": 3.88, + "learning_rate": 9.525601992803765e-06, + "loss": 0.087, + "step": 39675 + }, + { + "epoch": 3.88, + "learning_rate": 9.521450318295046e-06, + "loss": 0.1104, + "step": 39680 + }, + { + "epoch": 3.88, + "learning_rate": 9.517298643786327e-06, + "loss": 0.1113, + "step": 39685 + }, + { + "epoch": 3.88, + "learning_rate": 9.51314696927761e-06, + "loss": 0.095, + "step": 39690 + }, + { + "epoch": 3.88, + "learning_rate": 9.50899529476889e-06, + "loss": 0.0904, + "step": 39695 + }, + { + "epoch": 3.88, + "learning_rate": 9.504843620260172e-06, + "loss": 0.1192, + "step": 39700 + }, + { + "epoch": 3.88, + "learning_rate": 9.500691945751453e-06, + "loss": 0.1016, + "step": 39705 + }, + { + "epoch": 3.88, + "learning_rate": 9.496540271242734e-06, + "loss": 0.0881, + "step": 39710 + }, + { + "epoch": 3.88, + "learning_rate": 9.492388596734016e-06, + "loss": 0.1335, + "step": 39715 + }, + { + "epoch": 3.88, + "learning_rate": 9.488236922225297e-06, + "loss": 0.1019, + "step": 39720 + }, + { + "epoch": 3.88, + "learning_rate": 9.48408524771658e-06, + "loss": 0.091, + "step": 39725 + }, + { + "epoch": 3.88, + "learning_rate": 9.47993357320786e-06, + "loss": 0.1215, + "step": 39730 + }, + { + "epoch": 3.89, + "learning_rate": 9.475781898699143e-06, + "loss": 0.1043, + "step": 39735 + }, + { + "epoch": 3.89, + "learning_rate": 9.471630224190424e-06, + "loss": 0.0981, + "step": 39740 + }, + { + "epoch": 3.89, + "learning_rate": 9.467478549681704e-06, + "loss": 0.0801, + "step": 39745 + }, + { + "epoch": 3.89, + "learning_rate": 9.463326875172987e-06, + "loss": 0.1259, + "step": 39750 + }, + { + "epoch": 3.89, + "learning_rate": 9.459175200664268e-06, + "loss": 0.1049, + "step": 39755 + }, + { + "epoch": 3.89, + "learning_rate": 9.45502352615555e-06, + "loss": 0.091, + "step": 39760 + }, + { + "epoch": 3.89, + "learning_rate": 9.450871851646831e-06, + "loss": 0.1032, + "step": 39765 + }, + { + "epoch": 3.89, + "learning_rate": 9.446720177138112e-06, + "loss": 0.1037, + "step": 39770 + }, + { + "epoch": 3.89, + "learning_rate": 9.442568502629394e-06, + "loss": 0.0903, + "step": 39775 + }, + { + "epoch": 3.89, + "learning_rate": 9.438416828120677e-06, + "loss": 0.098, + "step": 39780 + }, + { + "epoch": 3.89, + "learning_rate": 9.434265153611957e-06, + "loss": 0.1125, + "step": 39785 + }, + { + "epoch": 3.89, + "learning_rate": 9.430113479103238e-06, + "loss": 0.0955, + "step": 39790 + }, + { + "epoch": 3.89, + "learning_rate": 9.425961804594519e-06, + "loss": 0.0919, + "step": 39795 + }, + { + "epoch": 3.89, + "learning_rate": 9.421810130085803e-06, + "loss": 0.1235, + "step": 39800 + }, + { + "epoch": 3.89, + "learning_rate": 9.417658455577084e-06, + "loss": 0.0937, + "step": 39805 + }, + { + "epoch": 3.89, + "learning_rate": 9.413506781068365e-06, + "loss": 0.0959, + "step": 39810 + }, + { + "epoch": 3.89, + "learning_rate": 9.409355106559645e-06, + "loss": 0.1264, + "step": 39815 + }, + { + "epoch": 3.89, + "learning_rate": 9.405203432050926e-06, + "loss": 0.1098, + "step": 39820 + }, + { + "epoch": 3.89, + "learning_rate": 9.40105175754221e-06, + "loss": 0.096, + "step": 39825 + }, + { + "epoch": 3.89, + "learning_rate": 9.396900083033491e-06, + "loss": 0.1052, + "step": 39830 + }, + { + "epoch": 3.9, + "learning_rate": 9.392748408524772e-06, + "loss": 0.116, + "step": 39835 + }, + { + "epoch": 3.9, + "learning_rate": 9.388596734016053e-06, + "loss": 0.1109, + "step": 39840 + }, + { + "epoch": 3.9, + "learning_rate": 9.384445059507335e-06, + "loss": 0.0948, + "step": 39845 + }, + { + "epoch": 3.9, + "learning_rate": 9.380293384998617e-06, + "loss": 0.0992, + "step": 39850 + }, + { + "epoch": 3.9, + "learning_rate": 9.376141710489898e-06, + "loss": 0.0952, + "step": 39855 + }, + { + "epoch": 3.9, + "learning_rate": 9.371990035981179e-06, + "loss": 0.0916, + "step": 39860 + }, + { + "epoch": 3.9, + "learning_rate": 9.36783836147246e-06, + "loss": 0.1025, + "step": 39865 + }, + { + "epoch": 3.9, + "learning_rate": 9.363686686963742e-06, + "loss": 0.1032, + "step": 39870 + }, + { + "epoch": 3.9, + "learning_rate": 9.359535012455025e-06, + "loss": 0.089, + "step": 39875 + }, + { + "epoch": 3.9, + "learning_rate": 9.355383337946305e-06, + "loss": 0.1195, + "step": 39880 + }, + { + "epoch": 3.9, + "learning_rate": 9.351231663437586e-06, + "loss": 0.1148, + "step": 39885 + }, + { + "epoch": 3.9, + "learning_rate": 9.347079988928869e-06, + "loss": 0.0929, + "step": 39890 + }, + { + "epoch": 3.9, + "learning_rate": 9.34292831442015e-06, + "loss": 0.102, + "step": 39895 + }, + { + "epoch": 3.9, + "learning_rate": 9.33877663991143e-06, + "loss": 0.128, + "step": 39900 + }, + { + "epoch": 3.9, + "learning_rate": 9.334624965402713e-06, + "loss": 0.1012, + "step": 39905 + }, + { + "epoch": 3.9, + "learning_rate": 9.330473290893995e-06, + "loss": 0.0865, + "step": 39910 + }, + { + "epoch": 3.9, + "learning_rate": 9.326321616385276e-06, + "loss": 0.1172, + "step": 39915 + }, + { + "epoch": 3.9, + "learning_rate": 9.322169941876557e-06, + "loss": 0.0951, + "step": 39920 + }, + { + "epoch": 3.9, + "learning_rate": 9.318018267367837e-06, + "loss": 0.0965, + "step": 39925 + }, + { + "epoch": 3.9, + "learning_rate": 9.31386659285912e-06, + "loss": 0.1043, + "step": 39930 + }, + { + "epoch": 3.9, + "learning_rate": 9.309714918350402e-06, + "loss": 0.1439, + "step": 39935 + }, + { + "epoch": 3.91, + "learning_rate": 9.305563243841683e-06, + "loss": 0.1126, + "step": 39940 + }, + { + "epoch": 3.91, + "learning_rate": 9.301411569332964e-06, + "loss": 0.0814, + "step": 39945 + }, + { + "epoch": 3.91, + "learning_rate": 9.297259894824245e-06, + "loss": 0.1247, + "step": 39950 + }, + { + "epoch": 3.91, + "learning_rate": 9.293108220315529e-06, + "loss": 0.1051, + "step": 39955 + }, + { + "epoch": 3.91, + "learning_rate": 9.28895654580681e-06, + "loss": 0.097, + "step": 39960 + }, + { + "epoch": 3.91, + "learning_rate": 9.28480487129809e-06, + "loss": 0.1092, + "step": 39965 + }, + { + "epoch": 3.91, + "learning_rate": 9.280653196789371e-06, + "loss": 0.1002, + "step": 39970 + }, + { + "epoch": 3.91, + "learning_rate": 9.276501522280652e-06, + "loss": 0.0919, + "step": 39975 + }, + { + "epoch": 3.91, + "learning_rate": 9.272349847771936e-06, + "loss": 0.0907, + "step": 39980 + }, + { + "epoch": 3.91, + "learning_rate": 9.268198173263217e-06, + "loss": 0.1191, + "step": 39985 + }, + { + "epoch": 3.91, + "learning_rate": 9.264046498754498e-06, + "loss": 0.097, + "step": 39990 + }, + { + "epoch": 3.91, + "learning_rate": 9.259894824245778e-06, + "loss": 0.1005, + "step": 39995 + }, + { + "epoch": 3.91, + "learning_rate": 9.255743149737061e-06, + "loss": 0.123, + "step": 40000 + }, + { + "epoch": 3.91, + "eval_cer": 0.05552973494176488, + "eval_loss": 0.22539959847927094, + "eval_runtime": 274.803, + "eval_samples_per_second": 59.57, + "eval_steps_per_second": 1.656, + "eval_wer": 0.1419457631102956, + "step": 40000 + }, + { + "epoch": 3.91, + "learning_rate": 9.251591475228343e-06, + "loss": 0.0858, + "step": 40005 + }, + { + "epoch": 3.91, + "learning_rate": 9.247439800719624e-06, + "loss": 0.1006, + "step": 40010 + }, + { + "epoch": 3.91, + "learning_rate": 9.243288126210905e-06, + "loss": 0.1131, + "step": 40015 + }, + { + "epoch": 3.91, + "learning_rate": 9.239136451702187e-06, + "loss": 0.097, + "step": 40020 + }, + { + "epoch": 3.91, + "learning_rate": 9.234984777193468e-06, + "loss": 0.0915, + "step": 40025 + }, + { + "epoch": 3.91, + "learning_rate": 9.23083310268475e-06, + "loss": 0.1057, + "step": 40030 + }, + { + "epoch": 3.91, + "learning_rate": 9.226681428176031e-06, + "loss": 0.1085, + "step": 40035 + }, + { + "epoch": 3.92, + "learning_rate": 9.222529753667312e-06, + "loss": 0.0882, + "step": 40040 + }, + { + "epoch": 3.92, + "learning_rate": 9.218378079158595e-06, + "loss": 0.1006, + "step": 40045 + }, + { + "epoch": 3.92, + "learning_rate": 9.214226404649875e-06, + "loss": 0.1097, + "step": 40050 + }, + { + "epoch": 3.92, + "learning_rate": 9.210074730141158e-06, + "loss": 0.1015, + "step": 40055 + }, + { + "epoch": 3.92, + "learning_rate": 9.205923055632439e-06, + "loss": 0.0912, + "step": 40060 + }, + { + "epoch": 3.92, + "learning_rate": 9.201771381123721e-06, + "loss": 0.1183, + "step": 40065 + }, + { + "epoch": 3.92, + "learning_rate": 9.197619706615002e-06, + "loss": 0.1101, + "step": 40070 + }, + { + "epoch": 3.92, + "learning_rate": 9.193468032106283e-06, + "loss": 0.0862, + "step": 40075 + }, + { + "epoch": 3.92, + "learning_rate": 9.189316357597565e-06, + "loss": 0.106, + "step": 40080 + }, + { + "epoch": 3.92, + "learning_rate": 9.185164683088846e-06, + "loss": 0.1156, + "step": 40085 + }, + { + "epoch": 3.92, + "learning_rate": 9.181013008580128e-06, + "loss": 0.0979, + "step": 40090 + }, + { + "epoch": 3.92, + "learning_rate": 9.176861334071409e-06, + "loss": 0.1004, + "step": 40095 + }, + { + "epoch": 3.92, + "learning_rate": 9.17270965956269e-06, + "loss": 0.1295, + "step": 40100 + }, + { + "epoch": 3.92, + "learning_rate": 9.16855798505397e-06, + "loss": 0.1076, + "step": 40105 + }, + { + "epoch": 3.92, + "learning_rate": 9.164406310545255e-06, + "loss": 0.0893, + "step": 40110 + }, + { + "epoch": 3.92, + "learning_rate": 9.160254636036535e-06, + "loss": 0.1133, + "step": 40115 + }, + { + "epoch": 3.92, + "learning_rate": 9.156102961527816e-06, + "loss": 0.11, + "step": 40120 + }, + { + "epoch": 3.92, + "learning_rate": 9.151951287019097e-06, + "loss": 0.0954, + "step": 40125 + }, + { + "epoch": 3.92, + "learning_rate": 9.14779961251038e-06, + "loss": 0.0888, + "step": 40130 + }, + { + "epoch": 3.92, + "learning_rate": 9.143647938001662e-06, + "loss": 0.1097, + "step": 40135 + }, + { + "epoch": 3.93, + "learning_rate": 9.139496263492943e-06, + "loss": 0.1073, + "step": 40140 + }, + { + "epoch": 3.93, + "learning_rate": 9.135344588984223e-06, + "loss": 0.0978, + "step": 40145 + }, + { + "epoch": 3.93, + "learning_rate": 9.131192914475504e-06, + "loss": 0.1074, + "step": 40150 + }, + { + "epoch": 3.93, + "learning_rate": 9.127041239966787e-06, + "loss": 0.098, + "step": 40155 + }, + { + "epoch": 3.93, + "learning_rate": 9.12288956545807e-06, + "loss": 0.0951, + "step": 40160 + }, + { + "epoch": 3.93, + "learning_rate": 9.11873789094935e-06, + "loss": 0.1033, + "step": 40165 + }, + { + "epoch": 3.93, + "learning_rate": 9.11458621644063e-06, + "loss": 0.0994, + "step": 40170 + }, + { + "epoch": 3.93, + "learning_rate": 9.110434541931913e-06, + "loss": 0.1009, + "step": 40175 + }, + { + "epoch": 3.93, + "learning_rate": 9.106282867423194e-06, + "loss": 0.0971, + "step": 40180 + }, + { + "epoch": 3.93, + "learning_rate": 9.102131192914476e-06, + "loss": 0.1153, + "step": 40185 + }, + { + "epoch": 3.93, + "learning_rate": 9.097979518405757e-06, + "loss": 0.0995, + "step": 40190 + }, + { + "epoch": 3.93, + "learning_rate": 9.093827843897038e-06, + "loss": 0.0875, + "step": 40195 + }, + { + "epoch": 3.93, + "learning_rate": 9.08967616938832e-06, + "loss": 0.106, + "step": 40200 + }, + { + "epoch": 3.93, + "learning_rate": 9.085524494879601e-06, + "loss": 0.093, + "step": 40205 + }, + { + "epoch": 3.93, + "learning_rate": 9.081372820370884e-06, + "loss": 0.1032, + "step": 40210 + }, + { + "epoch": 3.93, + "learning_rate": 9.077221145862164e-06, + "loss": 0.1005, + "step": 40215 + }, + { + "epoch": 3.93, + "learning_rate": 9.073069471353447e-06, + "loss": 0.0974, + "step": 40220 + }, + { + "epoch": 3.93, + "learning_rate": 9.068917796844728e-06, + "loss": 0.0884, + "step": 40225 + }, + { + "epoch": 3.93, + "learning_rate": 9.064766122336008e-06, + "loss": 0.1004, + "step": 40230 + }, + { + "epoch": 3.93, + "learning_rate": 9.06061444782729e-06, + "loss": 0.11, + "step": 40235 + }, + { + "epoch": 3.93, + "learning_rate": 9.056462773318573e-06, + "loss": 0.1033, + "step": 40240 + }, + { + "epoch": 3.94, + "learning_rate": 9.052311098809854e-06, + "loss": 0.0916, + "step": 40245 + }, + { + "epoch": 3.94, + "learning_rate": 9.048159424301135e-06, + "loss": 0.1232, + "step": 40250 + }, + { + "epoch": 3.94, + "learning_rate": 9.044007749792416e-06, + "loss": 0.0995, + "step": 40255 + }, + { + "epoch": 3.94, + "learning_rate": 9.039856075283698e-06, + "loss": 0.1164, + "step": 40260 + }, + { + "epoch": 3.94, + "learning_rate": 9.03570440077498e-06, + "loss": 0.116, + "step": 40265 + }, + { + "epoch": 3.94, + "learning_rate": 9.031552726266261e-06, + "loss": 0.0991, + "step": 40270 + }, + { + "epoch": 3.94, + "learning_rate": 9.027401051757542e-06, + "loss": 0.0954, + "step": 40275 + }, + { + "epoch": 3.94, + "learning_rate": 9.023249377248823e-06, + "loss": 0.1105, + "step": 40280 + }, + { + "epoch": 3.94, + "learning_rate": 9.019097702740105e-06, + "loss": 0.1058, + "step": 40285 + }, + { + "epoch": 3.94, + "learning_rate": 9.014946028231388e-06, + "loss": 0.0751, + "step": 40290 + }, + { + "epoch": 3.94, + "learning_rate": 9.010794353722669e-06, + "loss": 0.0846, + "step": 40295 + }, + { + "epoch": 3.94, + "learning_rate": 9.00664267921395e-06, + "loss": 0.1105, + "step": 40300 + }, + { + "epoch": 3.94, + "learning_rate": 9.00249100470523e-06, + "loss": 0.0964, + "step": 40305 + }, + { + "epoch": 3.94, + "learning_rate": 8.998339330196513e-06, + "loss": 0.0963, + "step": 40310 + }, + { + "epoch": 3.94, + "learning_rate": 8.994187655687795e-06, + "loss": 0.1209, + "step": 40315 + }, + { + "epoch": 3.94, + "learning_rate": 8.990035981179076e-06, + "loss": 0.1008, + "step": 40320 + }, + { + "epoch": 3.94, + "learning_rate": 8.985884306670357e-06, + "loss": 0.0844, + "step": 40325 + }, + { + "epoch": 3.94, + "learning_rate": 8.981732632161639e-06, + "loss": 0.0937, + "step": 40330 + }, + { + "epoch": 3.94, + "learning_rate": 8.97758095765292e-06, + "loss": 0.1052, + "step": 40335 + }, + { + "epoch": 3.94, + "learning_rate": 8.973429283144202e-06, + "loss": 0.1036, + "step": 40340 + }, + { + "epoch": 3.95, + "learning_rate": 8.969277608635483e-06, + "loss": 0.0975, + "step": 40345 + }, + { + "epoch": 3.95, + "learning_rate": 8.965125934126765e-06, + "loss": 0.1052, + "step": 40350 + }, + { + "epoch": 3.95, + "learning_rate": 8.960974259618046e-06, + "loss": 0.0937, + "step": 40355 + }, + { + "epoch": 3.95, + "learning_rate": 8.956822585109327e-06, + "loss": 0.0923, + "step": 40360 + }, + { + "epoch": 3.95, + "learning_rate": 8.95267091060061e-06, + "loss": 0.1072, + "step": 40365 + }, + { + "epoch": 3.95, + "learning_rate": 8.94851923609189e-06, + "loss": 0.1065, + "step": 40370 + }, + { + "epoch": 3.95, + "learning_rate": 8.944367561583173e-06, + "loss": 0.086, + "step": 40375 + }, + { + "epoch": 3.95, + "learning_rate": 8.940215887074453e-06, + "loss": 0.0969, + "step": 40380 + }, + { + "epoch": 3.95, + "learning_rate": 8.936064212565734e-06, + "loss": 0.1124, + "step": 40385 + }, + { + "epoch": 3.95, + "learning_rate": 8.931912538057017e-06, + "loss": 0.1081, + "step": 40390 + }, + { + "epoch": 3.95, + "learning_rate": 8.927760863548299e-06, + "loss": 0.0986, + "step": 40395 + }, + { + "epoch": 3.95, + "learning_rate": 8.92360918903958e-06, + "loss": 0.1299, + "step": 40400 + }, + { + "epoch": 3.95, + "learning_rate": 8.91945751453086e-06, + "loss": 0.0952, + "step": 40405 + }, + { + "epoch": 3.95, + "learning_rate": 8.915305840022141e-06, + "loss": 0.0941, + "step": 40410 + }, + { + "epoch": 3.95, + "learning_rate": 8.911154165513424e-06, + "loss": 0.0936, + "step": 40415 + }, + { + "epoch": 3.95, + "learning_rate": 8.907002491004706e-06, + "loss": 0.0999, + "step": 40420 + }, + { + "epoch": 3.95, + "learning_rate": 8.902850816495987e-06, + "loss": 0.0875, + "step": 40425 + }, + { + "epoch": 3.95, + "learning_rate": 8.898699141987268e-06, + "loss": 0.0975, + "step": 40430 + }, + { + "epoch": 3.95, + "learning_rate": 8.894547467478549e-06, + "loss": 0.1209, + "step": 40435 + }, + { + "epoch": 3.95, + "learning_rate": 8.890395792969833e-06, + "loss": 0.0881, + "step": 40440 + }, + { + "epoch": 3.95, + "learning_rate": 8.886244118461114e-06, + "loss": 0.0915, + "step": 40445 + }, + { + "epoch": 3.96, + "learning_rate": 8.882092443952394e-06, + "loss": 0.1248, + "step": 40450 + }, + { + "epoch": 3.96, + "learning_rate": 8.877940769443675e-06, + "loss": 0.0952, + "step": 40455 + }, + { + "epoch": 3.96, + "learning_rate": 8.873789094934956e-06, + "loss": 0.0873, + "step": 40460 + }, + { + "epoch": 3.96, + "learning_rate": 8.86963742042624e-06, + "loss": 0.1183, + "step": 40465 + }, + { + "epoch": 3.96, + "learning_rate": 8.86548574591752e-06, + "loss": 0.1046, + "step": 40470 + }, + { + "epoch": 3.96, + "learning_rate": 8.861334071408802e-06, + "loss": 0.0996, + "step": 40475 + }, + { + "epoch": 3.96, + "learning_rate": 8.857182396900082e-06, + "loss": 0.0978, + "step": 40480 + }, + { + "epoch": 3.96, + "learning_rate": 8.853030722391365e-06, + "loss": 0.0983, + "step": 40485 + }, + { + "epoch": 3.96, + "learning_rate": 8.848879047882647e-06, + "loss": 0.098, + "step": 40490 + }, + { + "epoch": 3.96, + "learning_rate": 8.844727373373928e-06, + "loss": 0.0993, + "step": 40495 + }, + { + "epoch": 3.96, + "learning_rate": 8.840575698865209e-06, + "loss": 0.1162, + "step": 40500 + }, + { + "epoch": 3.96, + "eval_cer": 0.05570778156223192, + "eval_loss": 0.22509299218654633, + "eval_runtime": 275.6477, + "eval_samples_per_second": 59.387, + "eval_steps_per_second": 1.651, + "eval_wer": 0.1422461359644254, + "step": 40500 + }, + { + "epoch": 3.96, + "learning_rate": 8.836424024356491e-06, + "loss": 0.0828, + "step": 40505 + }, + { + "epoch": 3.96, + "learning_rate": 8.832272349847772e-06, + "loss": 0.0874, + "step": 40510 + }, + { + "epoch": 3.96, + "learning_rate": 8.828120675339053e-06, + "loss": 0.1193, + "step": 40515 + }, + { + "epoch": 3.96, + "learning_rate": 8.823969000830335e-06, + "loss": 0.108, + "step": 40520 + }, + { + "epoch": 3.96, + "learning_rate": 8.819817326321616e-06, + "loss": 0.0971, + "step": 40525 + }, + { + "epoch": 3.96, + "learning_rate": 8.815665651812899e-06, + "loss": 0.1089, + "step": 40530 + }, + { + "epoch": 3.96, + "learning_rate": 8.81151397730418e-06, + "loss": 0.1103, + "step": 40535 + }, + { + "epoch": 3.96, + "learning_rate": 8.80736230279546e-06, + "loss": 0.0973, + "step": 40540 + }, + { + "epoch": 3.96, + "learning_rate": 8.803210628286743e-06, + "loss": 0.0956, + "step": 40545 + }, + { + "epoch": 3.97, + "learning_rate": 8.799058953778025e-06, + "loss": 0.1316, + "step": 40550 + }, + { + "epoch": 3.97, + "learning_rate": 8.794907279269306e-06, + "loss": 0.0967, + "step": 40555 + }, + { + "epoch": 3.97, + "learning_rate": 8.790755604760587e-06, + "loss": 0.0926, + "step": 40560 + }, + { + "epoch": 3.97, + "learning_rate": 8.786603930251867e-06, + "loss": 0.1167, + "step": 40565 + }, + { + "epoch": 3.97, + "learning_rate": 8.78245225574315e-06, + "loss": 0.1215, + "step": 40570 + }, + { + "epoch": 3.97, + "learning_rate": 8.778300581234432e-06, + "loss": 0.0903, + "step": 40575 + }, + { + "epoch": 3.97, + "learning_rate": 8.774148906725713e-06, + "loss": 0.1082, + "step": 40580 + }, + { + "epoch": 3.97, + "learning_rate": 8.769997232216994e-06, + "loss": 0.0998, + "step": 40585 + }, + { + "epoch": 3.97, + "learning_rate": 8.765845557708275e-06, + "loss": 0.0874, + "step": 40590 + }, + { + "epoch": 3.97, + "learning_rate": 8.761693883199559e-06, + "loss": 0.0873, + "step": 40595 + }, + { + "epoch": 3.97, + "learning_rate": 8.75754220869084e-06, + "loss": 0.1111, + "step": 40600 + }, + { + "epoch": 3.97, + "learning_rate": 8.75339053418212e-06, + "loss": 0.1032, + "step": 40605 + }, + { + "epoch": 3.97, + "learning_rate": 8.749238859673401e-06, + "loss": 0.0984, + "step": 40610 + }, + { + "epoch": 3.97, + "learning_rate": 8.745087185164683e-06, + "loss": 0.1226, + "step": 40615 + }, + { + "epoch": 3.97, + "learning_rate": 8.740935510655966e-06, + "loss": 0.1079, + "step": 40620 + }, + { + "epoch": 3.97, + "learning_rate": 8.736783836147247e-06, + "loss": 0.092, + "step": 40625 + }, + { + "epoch": 3.97, + "learning_rate": 8.732632161638527e-06, + "loss": 0.0945, + "step": 40630 + }, + { + "epoch": 3.97, + "learning_rate": 8.728480487129808e-06, + "loss": 0.1133, + "step": 40635 + }, + { + "epoch": 3.97, + "learning_rate": 8.72432881262109e-06, + "loss": 0.0915, + "step": 40640 + }, + { + "epoch": 3.97, + "learning_rate": 8.720177138112373e-06, + "loss": 0.0988, + "step": 40645 + }, + { + "epoch": 3.97, + "learning_rate": 8.716025463603654e-06, + "loss": 0.1122, + "step": 40650 + }, + { + "epoch": 3.98, + "learning_rate": 8.711873789094935e-06, + "loss": 0.0968, + "step": 40655 + }, + { + "epoch": 3.98, + "learning_rate": 8.707722114586217e-06, + "loss": 0.086, + "step": 40660 + }, + { + "epoch": 3.98, + "learning_rate": 8.703570440077498e-06, + "loss": 0.098, + "step": 40665 + }, + { + "epoch": 3.98, + "learning_rate": 8.69941876556878e-06, + "loss": 0.0933, + "step": 40670 + }, + { + "epoch": 3.98, + "learning_rate": 8.695267091060061e-06, + "loss": 0.093, + "step": 40675 + }, + { + "epoch": 3.98, + "learning_rate": 8.691115416551342e-06, + "loss": 0.0879, + "step": 40680 + }, + { + "epoch": 3.98, + "learning_rate": 8.686963742042624e-06, + "loss": 0.112, + "step": 40685 + }, + { + "epoch": 3.98, + "learning_rate": 8.682812067533905e-06, + "loss": 0.0939, + "step": 40690 + }, + { + "epoch": 3.98, + "learning_rate": 8.678660393025188e-06, + "loss": 0.0892, + "step": 40695 + }, + { + "epoch": 3.98, + "learning_rate": 8.674508718516468e-06, + "loss": 0.1259, + "step": 40700 + }, + { + "epoch": 3.98, + "learning_rate": 8.67035704400775e-06, + "loss": 0.0971, + "step": 40705 + }, + { + "epoch": 3.98, + "learning_rate": 8.666205369499032e-06, + "loss": 0.0915, + "step": 40710 + }, + { + "epoch": 3.98, + "learning_rate": 8.662053694990312e-06, + "loss": 0.1178, + "step": 40715 + }, + { + "epoch": 3.98, + "learning_rate": 8.657902020481593e-06, + "loss": 0.1101, + "step": 40720 + }, + { + "epoch": 3.98, + "learning_rate": 8.653750345972877e-06, + "loss": 0.0822, + "step": 40725 + }, + { + "epoch": 3.98, + "learning_rate": 8.649598671464158e-06, + "loss": 0.0933, + "step": 40730 + }, + { + "epoch": 3.98, + "learning_rate": 8.645446996955439e-06, + "loss": 0.1147, + "step": 40735 + }, + { + "epoch": 3.98, + "learning_rate": 8.64129532244672e-06, + "loss": 0.0919, + "step": 40740 + }, + { + "epoch": 3.98, + "learning_rate": 8.637143647938e-06, + "loss": 0.102, + "step": 40745 + }, + { + "epoch": 3.98, + "learning_rate": 8.632991973429285e-06, + "loss": 0.1042, + "step": 40750 + }, + { + "epoch": 3.99, + "learning_rate": 8.628840298920565e-06, + "loss": 0.0984, + "step": 40755 + }, + { + "epoch": 3.99, + "learning_rate": 8.624688624411846e-06, + "loss": 0.0981, + "step": 40760 + }, + { + "epoch": 3.99, + "learning_rate": 8.620536949903127e-06, + "loss": 0.1059, + "step": 40765 + }, + { + "epoch": 3.99, + "learning_rate": 8.61638527539441e-06, + "loss": 0.0849, + "step": 40770 + }, + { + "epoch": 3.99, + "learning_rate": 8.612233600885692e-06, + "loss": 0.0882, + "step": 40775 + }, + { + "epoch": 3.99, + "learning_rate": 8.608081926376973e-06, + "loss": 0.1057, + "step": 40780 + }, + { + "epoch": 3.99, + "learning_rate": 8.603930251868253e-06, + "loss": 0.119, + "step": 40785 + }, + { + "epoch": 3.99, + "learning_rate": 8.599778577359534e-06, + "loss": 0.0934, + "step": 40790 + }, + { + "epoch": 3.99, + "learning_rate": 8.595626902850817e-06, + "loss": 0.0883, + "step": 40795 + }, + { + "epoch": 3.99, + "learning_rate": 8.591475228342099e-06, + "loss": 0.1243, + "step": 40800 + }, + { + "epoch": 3.99, + "learning_rate": 8.58732355383338e-06, + "loss": 0.0865, + "step": 40805 + }, + { + "epoch": 3.99, + "learning_rate": 8.58317187932466e-06, + "loss": 0.0868, + "step": 40810 + }, + { + "epoch": 3.99, + "learning_rate": 8.579020204815943e-06, + "loss": 0.1152, + "step": 40815 + }, + { + "epoch": 3.99, + "learning_rate": 8.574868530307224e-06, + "loss": 0.0958, + "step": 40820 + }, + { + "epoch": 3.99, + "learning_rate": 8.570716855798506e-06, + "loss": 0.0837, + "step": 40825 + }, + { + "epoch": 3.99, + "learning_rate": 8.566565181289787e-06, + "loss": 0.1045, + "step": 40830 + }, + { + "epoch": 3.99, + "learning_rate": 8.56241350678107e-06, + "loss": 0.1134, + "step": 40835 + }, + { + "epoch": 3.99, + "learning_rate": 8.55826183227235e-06, + "loss": 0.0882, + "step": 40840 + }, + { + "epoch": 3.99, + "learning_rate": 8.554110157763631e-06, + "loss": 0.0875, + "step": 40845 + }, + { + "epoch": 3.99, + "learning_rate": 8.549958483254913e-06, + "loss": 0.1285, + "step": 40850 + }, + { + "epoch": 3.99, + "learning_rate": 8.545806808746194e-06, + "loss": 0.1039, + "step": 40855 + }, + { + "epoch": 4.0, + "learning_rate": 8.541655134237477e-06, + "loss": 0.0889, + "step": 40860 + }, + { + "epoch": 4.0, + "learning_rate": 8.537503459728757e-06, + "loss": 0.1297, + "step": 40865 + }, + { + "epoch": 4.0, + "learning_rate": 8.533351785220038e-06, + "loss": 0.1181, + "step": 40870 + }, + { + "epoch": 4.0, + "learning_rate": 8.52920011071132e-06, + "loss": 0.0939, + "step": 40875 + }, + { + "epoch": 4.0, + "learning_rate": 8.525048436202603e-06, + "loss": 0.0982, + "step": 40880 + }, + { + "epoch": 4.0, + "learning_rate": 8.520896761693884e-06, + "loss": 0.1092, + "step": 40885 + }, + { + "epoch": 4.0, + "learning_rate": 8.516745087185165e-06, + "loss": 0.0883, + "step": 40890 + }, + { + "epoch": 4.0, + "learning_rate": 8.512593412676445e-06, + "loss": 0.0963, + "step": 40895 + }, + { + "epoch": 4.0, + "learning_rate": 8.508441738167728e-06, + "loss": 0.1083, + "step": 40900 + }, + { + "epoch": 4.0, + "learning_rate": 8.50429006365901e-06, + "loss": 0.092, + "step": 40905 + }, + { + "epoch": 4.0, + "learning_rate": 8.500138389150291e-06, + "loss": 0.1068, + "step": 40910 + }, + { + "epoch": 4.0, + "learning_rate": 8.495986714641572e-06, + "loss": 0.0881, + "step": 40915 + }, + { + "epoch": 4.0, + "learning_rate": 8.491835040132853e-06, + "loss": 0.0897, + "step": 40920 + }, + { + "epoch": 4.0, + "learning_rate": 8.487683365624135e-06, + "loss": 0.0941, + "step": 40925 + }, + { + "epoch": 4.0, + "learning_rate": 8.483531691115418e-06, + "loss": 0.0924, + "step": 40930 + }, + { + "epoch": 4.0, + "learning_rate": 8.479380016606698e-06, + "loss": 0.0921, + "step": 40935 + }, + { + "epoch": 4.0, + "learning_rate": 8.475228342097979e-06, + "loss": 0.0953, + "step": 40940 + }, + { + "epoch": 4.0, + "learning_rate": 8.471076667589262e-06, + "loss": 0.1088, + "step": 40945 + }, + { + "epoch": 4.0, + "learning_rate": 8.466924993080542e-06, + "loss": 0.0925, + "step": 40950 + }, + { + "epoch": 4.0, + "learning_rate": 8.462773318571825e-06, + "loss": 0.0816, + "step": 40955 + }, + { + "epoch": 4.01, + "learning_rate": 8.458621644063106e-06, + "loss": 0.0954, + "step": 40960 + }, + { + "epoch": 4.01, + "learning_rate": 8.454469969554386e-06, + "loss": 0.092, + "step": 40965 + }, + { + "epoch": 4.01, + "learning_rate": 8.450318295045669e-06, + "loss": 0.0895, + "step": 40970 + }, + { + "epoch": 4.01, + "learning_rate": 8.44616662053695e-06, + "loss": 0.0948, + "step": 40975 + }, + { + "epoch": 4.01, + "learning_rate": 8.442014946028232e-06, + "loss": 0.0905, + "step": 40980 + }, + { + "epoch": 4.01, + "learning_rate": 8.437863271519513e-06, + "loss": 0.0779, + "step": 40985 + }, + { + "epoch": 4.01, + "learning_rate": 8.433711597010795e-06, + "loss": 0.1046, + "step": 40990 + }, + { + "epoch": 4.01, + "learning_rate": 8.429559922502076e-06, + "loss": 0.1034, + "step": 40995 + }, + { + "epoch": 4.01, + "learning_rate": 8.425408247993357e-06, + "loss": 0.0856, + "step": 41000 + }, + { + "epoch": 4.01, + "eval_cer": 0.05485107671959507, + "eval_loss": 0.22533003985881805, + "eval_runtime": 272.696, + "eval_samples_per_second": 60.03, + "eval_steps_per_second": 1.669, + "eval_wer": 0.14007169769431185, + "step": 41000 + }, + { + "epoch": 4.01, + "learning_rate": 8.42125657348464e-06, + "loss": 0.099, + "step": 41005 + }, + { + "epoch": 4.01, + "learning_rate": 8.41710489897592e-06, + "loss": 0.1047, + "step": 41010 + }, + { + "epoch": 4.01, + "learning_rate": 8.412953224467203e-06, + "loss": 0.0872, + "step": 41015 + }, + { + "epoch": 4.01, + "learning_rate": 8.408801549958483e-06, + "loss": 0.0785, + "step": 41020 + }, + { + "epoch": 4.01, + "learning_rate": 8.404649875449764e-06, + "loss": 0.1087, + "step": 41025 + }, + { + "epoch": 4.01, + "learning_rate": 8.400498200941047e-06, + "loss": 0.1046, + "step": 41030 + }, + { + "epoch": 4.01, + "learning_rate": 8.396346526432329e-06, + "loss": 0.0822, + "step": 41035 + }, + { + "epoch": 4.01, + "learning_rate": 8.39219485192361e-06, + "loss": 0.0918, + "step": 41040 + }, + { + "epoch": 4.01, + "learning_rate": 8.38804317741489e-06, + "loss": 0.1158, + "step": 41045 + }, + { + "epoch": 4.01, + "learning_rate": 8.383891502906171e-06, + "loss": 0.0858, + "step": 41050 + }, + { + "epoch": 4.01, + "learning_rate": 8.379739828397455e-06, + "loss": 0.0798, + "step": 41055 + }, + { + "epoch": 4.01, + "learning_rate": 8.375588153888736e-06, + "loss": 0.1195, + "step": 41060 + }, + { + "epoch": 4.02, + "learning_rate": 8.371436479380017e-06, + "loss": 0.1012, + "step": 41065 + }, + { + "epoch": 4.02, + "learning_rate": 8.367284804871298e-06, + "loss": 0.0825, + "step": 41070 + }, + { + "epoch": 4.02, + "learning_rate": 8.363133130362579e-06, + "loss": 0.0943, + "step": 41075 + }, + { + "epoch": 4.02, + "learning_rate": 8.358981455853863e-06, + "loss": 0.0971, + "step": 41080 + }, + { + "epoch": 4.02, + "learning_rate": 8.354829781345143e-06, + "loss": 0.0817, + "step": 41085 + }, + { + "epoch": 4.02, + "learning_rate": 8.350678106836424e-06, + "loss": 0.0994, + "step": 41090 + }, + { + "epoch": 4.02, + "learning_rate": 8.346526432327705e-06, + "loss": 0.1236, + "step": 41095 + }, + { + "epoch": 4.02, + "learning_rate": 8.342374757818987e-06, + "loss": 0.093, + "step": 41100 + }, + { + "epoch": 4.02, + "learning_rate": 8.338223083310268e-06, + "loss": 0.0895, + "step": 41105 + }, + { + "epoch": 4.02, + "learning_rate": 8.33407140880155e-06, + "loss": 0.1103, + "step": 41110 + }, + { + "epoch": 4.02, + "learning_rate": 8.329919734292831e-06, + "loss": 0.0934, + "step": 41115 + }, + { + "epoch": 4.02, + "learning_rate": 8.325768059784112e-06, + "loss": 0.0891, + "step": 41120 + }, + { + "epoch": 4.02, + "learning_rate": 8.321616385275395e-06, + "loss": 0.0969, + "step": 41125 + }, + { + "epoch": 4.02, + "learning_rate": 8.317464710766675e-06, + "loss": 0.0926, + "step": 41130 + }, + { + "epoch": 4.02, + "learning_rate": 8.313313036257958e-06, + "loss": 0.0841, + "step": 41135 + }, + { + "epoch": 4.02, + "learning_rate": 8.309161361749239e-06, + "loss": 0.1015, + "step": 41140 + }, + { + "epoch": 4.02, + "learning_rate": 8.305009687240521e-06, + "loss": 0.0954, + "step": 41145 + }, + { + "epoch": 4.02, + "learning_rate": 8.300858012731802e-06, + "loss": 0.0957, + "step": 41150 + }, + { + "epoch": 4.02, + "learning_rate": 8.296706338223083e-06, + "loss": 0.092, + "step": 41155 + }, + { + "epoch": 4.02, + "learning_rate": 8.292554663714365e-06, + "loss": 0.1053, + "step": 41160 + }, + { + "epoch": 4.03, + "learning_rate": 8.288402989205648e-06, + "loss": 0.1137, + "step": 41165 + }, + { + "epoch": 4.03, + "learning_rate": 8.284251314696928e-06, + "loss": 0.0825, + "step": 41170 + }, + { + "epoch": 4.03, + "learning_rate": 8.280099640188209e-06, + "loss": 0.112, + "step": 41175 + }, + { + "epoch": 4.03, + "learning_rate": 8.27594796567949e-06, + "loss": 0.0989, + "step": 41180 + }, + { + "epoch": 4.03, + "learning_rate": 8.271796291170772e-06, + "loss": 0.085, + "step": 41185 + }, + { + "epoch": 4.03, + "learning_rate": 8.267644616662055e-06, + "loss": 0.0902, + "step": 41190 + }, + { + "epoch": 4.03, + "learning_rate": 8.263492942153336e-06, + "loss": 0.1081, + "step": 41195 + }, + { + "epoch": 4.03, + "learning_rate": 8.259341267644616e-06, + "loss": 0.0958, + "step": 41200 + }, + { + "epoch": 4.03, + "learning_rate": 8.255189593135897e-06, + "loss": 0.0774, + "step": 41205 + }, + { + "epoch": 4.03, + "learning_rate": 8.251037918627181e-06, + "loss": 0.1119, + "step": 41210 + }, + { + "epoch": 4.03, + "learning_rate": 8.246886244118462e-06, + "loss": 0.098, + "step": 41215 + }, + { + "epoch": 4.03, + "learning_rate": 8.242734569609743e-06, + "loss": 0.0706, + "step": 41220 + }, + { + "epoch": 4.03, + "learning_rate": 8.238582895101024e-06, + "loss": 0.1198, + "step": 41225 + }, + { + "epoch": 4.03, + "learning_rate": 8.234431220592304e-06, + "loss": 0.09, + "step": 41230 + }, + { + "epoch": 4.03, + "learning_rate": 8.230279546083589e-06, + "loss": 0.0943, + "step": 41235 + }, + { + "epoch": 4.03, + "learning_rate": 8.22612787157487e-06, + "loss": 0.0965, + "step": 41240 + }, + { + "epoch": 4.03, + "learning_rate": 8.22197619706615e-06, + "loss": 0.1083, + "step": 41245 + }, + { + "epoch": 4.03, + "learning_rate": 8.21782452255743e-06, + "loss": 0.0865, + "step": 41250 + }, + { + "epoch": 4.03, + "learning_rate": 8.213672848048713e-06, + "loss": 0.0867, + "step": 41255 + }, + { + "epoch": 4.03, + "learning_rate": 8.209521173539996e-06, + "loss": 0.104, + "step": 41260 + }, + { + "epoch": 4.04, + "learning_rate": 8.205369499031277e-06, + "loss": 0.0937, + "step": 41265 + }, + { + "epoch": 4.04, + "learning_rate": 8.201217824522557e-06, + "loss": 0.0745, + "step": 41270 + }, + { + "epoch": 4.04, + "learning_rate": 8.197066150013838e-06, + "loss": 0.0987, + "step": 41275 + }, + { + "epoch": 4.04, + "learning_rate": 8.19291447550512e-06, + "loss": 0.0902, + "step": 41280 + }, + { + "epoch": 4.04, + "learning_rate": 8.188762800996403e-06, + "loss": 0.0861, + "step": 41285 + }, + { + "epoch": 4.04, + "learning_rate": 8.184611126487684e-06, + "loss": 0.0816, + "step": 41290 + }, + { + "epoch": 4.04, + "learning_rate": 8.180459451978965e-06, + "loss": 0.1134, + "step": 41295 + }, + { + "epoch": 4.04, + "learning_rate": 8.176307777470247e-06, + "loss": 0.0863, + "step": 41300 + }, + { + "epoch": 4.04, + "learning_rate": 8.172156102961528e-06, + "loss": 0.0849, + "step": 41305 + }, + { + "epoch": 4.04, + "learning_rate": 8.16800442845281e-06, + "loss": 0.1136, + "step": 41310 + }, + { + "epoch": 4.04, + "learning_rate": 8.163852753944091e-06, + "loss": 0.0849, + "step": 41315 + }, + { + "epoch": 4.04, + "learning_rate": 8.159701079435373e-06, + "loss": 0.0898, + "step": 41320 + }, + { + "epoch": 4.04, + "learning_rate": 8.155549404926654e-06, + "loss": 0.0874, + "step": 41325 + }, + { + "epoch": 4.04, + "learning_rate": 8.151397730417935e-06, + "loss": 0.0955, + "step": 41330 + }, + { + "epoch": 4.04, + "learning_rate": 8.147246055909216e-06, + "loss": 0.0821, + "step": 41335 + }, + { + "epoch": 4.04, + "learning_rate": 8.143094381400498e-06, + "loss": 0.0878, + "step": 41340 + }, + { + "epoch": 4.04, + "learning_rate": 8.13894270689178e-06, + "loss": 0.1178, + "step": 41345 + }, + { + "epoch": 4.04, + "learning_rate": 8.134791032383061e-06, + "loss": 0.0965, + "step": 41350 + }, + { + "epoch": 4.04, + "learning_rate": 8.130639357874342e-06, + "loss": 0.0789, + "step": 41355 + }, + { + "epoch": 4.04, + "learning_rate": 8.126487683365623e-06, + "loss": 0.112, + "step": 41360 + }, + { + "epoch": 4.04, + "learning_rate": 8.122336008856907e-06, + "loss": 0.0855, + "step": 41365 + }, + { + "epoch": 4.05, + "learning_rate": 8.118184334348188e-06, + "loss": 0.0953, + "step": 41370 + }, + { + "epoch": 4.05, + "learning_rate": 8.114032659839469e-06, + "loss": 0.1126, + "step": 41375 + }, + { + "epoch": 4.05, + "learning_rate": 8.10988098533075e-06, + "loss": 0.0877, + "step": 41380 + }, + { + "epoch": 4.05, + "learning_rate": 8.10572931082203e-06, + "loss": 0.0833, + "step": 41385 + }, + { + "epoch": 4.05, + "learning_rate": 8.101577636313314e-06, + "loss": 0.0966, + "step": 41390 + }, + { + "epoch": 4.05, + "learning_rate": 8.097425961804595e-06, + "loss": 0.1123, + "step": 41395 + }, + { + "epoch": 4.05, + "learning_rate": 8.093274287295876e-06, + "loss": 0.0912, + "step": 41400 + }, + { + "epoch": 4.05, + "learning_rate": 8.089122612787157e-06, + "loss": 0.0845, + "step": 41405 + }, + { + "epoch": 4.05, + "learning_rate": 8.084970938278439e-06, + "loss": 0.0958, + "step": 41410 + }, + { + "epoch": 4.05, + "learning_rate": 8.080819263769722e-06, + "loss": 0.0957, + "step": 41415 + }, + { + "epoch": 4.05, + "learning_rate": 8.076667589261002e-06, + "loss": 0.0925, + "step": 41420 + }, + { + "epoch": 4.05, + "learning_rate": 8.072515914752283e-06, + "loss": 0.0958, + "step": 41425 + }, + { + "epoch": 4.05, + "learning_rate": 8.068364240243566e-06, + "loss": 0.0807, + "step": 41430 + }, + { + "epoch": 4.05, + "learning_rate": 8.064212565734846e-06, + "loss": 0.0867, + "step": 41435 + }, + { + "epoch": 4.05, + "learning_rate": 8.060060891226129e-06, + "loss": 0.0958, + "step": 41440 + }, + { + "epoch": 4.05, + "learning_rate": 8.05590921671741e-06, + "loss": 0.1004, + "step": 41445 + }, + { + "epoch": 4.05, + "learning_rate": 8.05175754220869e-06, + "loss": 0.0829, + "step": 41450 + }, + { + "epoch": 4.05, + "learning_rate": 8.047605867699973e-06, + "loss": 0.0926, + "step": 41455 + }, + { + "epoch": 4.05, + "learning_rate": 8.043454193191254e-06, + "loss": 0.1005, + "step": 41460 + }, + { + "epoch": 4.05, + "learning_rate": 8.039302518682536e-06, + "loss": 0.0987, + "step": 41465 + }, + { + "epoch": 4.06, + "learning_rate": 8.035150844173817e-06, + "loss": 0.0908, + "step": 41470 + }, + { + "epoch": 4.06, + "learning_rate": 8.0309991696651e-06, + "loss": 0.1072, + "step": 41475 + }, + { + "epoch": 4.06, + "learning_rate": 8.02684749515638e-06, + "loss": 0.1177, + "step": 41480 + }, + { + "epoch": 4.06, + "learning_rate": 8.02269582064766e-06, + "loss": 0.086, + "step": 41485 + }, + { + "epoch": 4.06, + "learning_rate": 8.018544146138943e-06, + "loss": 0.1012, + "step": 41490 + }, + { + "epoch": 4.06, + "learning_rate": 8.014392471630224e-06, + "loss": 0.1036, + "step": 41495 + }, + { + "epoch": 4.06, + "learning_rate": 8.010240797121507e-06, + "loss": 0.0983, + "step": 41500 + }, + { + "epoch": 4.06, + "eval_cer": 0.054671873952241885, + "eval_loss": 0.22581814229488373, + "eval_runtime": 277.2232, + "eval_samples_per_second": 59.05, + "eval_steps_per_second": 1.641, + "eval_wer": 0.1389420345689976, + "step": 41500 + }, + { + "epoch": 4.06, + "learning_rate": 8.006089122612787e-06, + "loss": 0.0875, + "step": 41505 + }, + { + "epoch": 4.06, + "learning_rate": 8.001937448104068e-06, + "loss": 0.1124, + "step": 41510 + }, + { + "epoch": 4.06, + "learning_rate": 7.99778577359535e-06, + "loss": 0.0862, + "step": 41515 + }, + { + "epoch": 4.06, + "learning_rate": 7.993634099086633e-06, + "loss": 0.0856, + "step": 41520 + }, + { + "epoch": 4.06, + "learning_rate": 7.989482424577914e-06, + "loss": 0.1031, + "step": 41525 + }, + { + "epoch": 4.06, + "learning_rate": 7.985330750069195e-06, + "loss": 0.1067, + "step": 41530 + }, + { + "epoch": 4.06, + "learning_rate": 7.981179075560475e-06, + "loss": 0.0893, + "step": 41535 + }, + { + "epoch": 4.06, + "learning_rate": 7.977027401051758e-06, + "loss": 0.0824, + "step": 41540 + }, + { + "epoch": 4.06, + "learning_rate": 7.97287572654304e-06, + "loss": 0.096, + "step": 41545 + }, + { + "epoch": 4.06, + "learning_rate": 7.968724052034321e-06, + "loss": 0.0868, + "step": 41550 + }, + { + "epoch": 4.06, + "learning_rate": 7.964572377525602e-06, + "loss": 0.0898, + "step": 41555 + }, + { + "epoch": 4.06, + "learning_rate": 7.960420703016883e-06, + "loss": 0.1021, + "step": 41560 + }, + { + "epoch": 4.06, + "learning_rate": 7.956269028508165e-06, + "loss": 0.0945, + "step": 41565 + }, + { + "epoch": 4.06, + "learning_rate": 7.952947688901191e-06, + "loss": 0.0795, + "step": 41570 + }, + { + "epoch": 4.07, + "learning_rate": 7.948796014392472e-06, + "loss": 0.1021, + "step": 41575 + }, + { + "epoch": 4.07, + "learning_rate": 7.944644339883753e-06, + "loss": 0.0913, + "step": 41580 + }, + { + "epoch": 4.07, + "learning_rate": 7.940492665375034e-06, + "loss": 0.0926, + "step": 41585 + }, + { + "epoch": 4.07, + "learning_rate": 7.936340990866318e-06, + "loss": 0.0924, + "step": 41590 + }, + { + "epoch": 4.07, + "learning_rate": 7.932189316357599e-06, + "loss": 0.1018, + "step": 41595 + }, + { + "epoch": 4.07, + "learning_rate": 7.92803764184888e-06, + "loss": 0.0808, + "step": 41600 + }, + { + "epoch": 4.07, + "learning_rate": 7.92388596734016e-06, + "loss": 0.085, + "step": 41605 + }, + { + "epoch": 4.07, + "learning_rate": 7.91973429283144e-06, + "loss": 0.0876, + "step": 41610 + }, + { + "epoch": 4.07, + "learning_rate": 7.915582618322725e-06, + "loss": 0.0913, + "step": 41615 + }, + { + "epoch": 4.07, + "learning_rate": 7.911430943814006e-06, + "loss": 0.0919, + "step": 41620 + }, + { + "epoch": 4.07, + "learning_rate": 7.907279269305287e-06, + "loss": 0.1077, + "step": 41625 + }, + { + "epoch": 4.07, + "learning_rate": 7.903127594796567e-06, + "loss": 0.0858, + "step": 41630 + }, + { + "epoch": 4.07, + "learning_rate": 7.89897592028785e-06, + "loss": 0.0814, + "step": 41635 + }, + { + "epoch": 4.07, + "learning_rate": 7.894824245779132e-06, + "loss": 0.0913, + "step": 41640 + }, + { + "epoch": 4.07, + "learning_rate": 7.890672571270413e-06, + "loss": 0.1123, + "step": 41645 + }, + { + "epoch": 4.07, + "learning_rate": 7.886520896761694e-06, + "loss": 0.0895, + "step": 41650 + }, + { + "epoch": 4.07, + "learning_rate": 7.882369222252975e-06, + "loss": 0.0865, + "step": 41655 + }, + { + "epoch": 4.07, + "learning_rate": 7.878217547744257e-06, + "loss": 0.1194, + "step": 41660 + }, + { + "epoch": 4.07, + "learning_rate": 7.87406587323554e-06, + "loss": 0.1034, + "step": 41665 + }, + { + "epoch": 4.07, + "learning_rate": 7.86991419872682e-06, + "loss": 0.0778, + "step": 41670 + }, + { + "epoch": 4.08, + "learning_rate": 7.865762524218101e-06, + "loss": 0.1145, + "step": 41675 + }, + { + "epoch": 4.08, + "learning_rate": 7.861610849709383e-06, + "loss": 0.0929, + "step": 41680 + }, + { + "epoch": 4.08, + "learning_rate": 7.857459175200664e-06, + "loss": 0.0996, + "step": 41685 + }, + { + "epoch": 4.08, + "learning_rate": 7.853307500691945e-06, + "loss": 0.1008, + "step": 41690 + }, + { + "epoch": 4.08, + "learning_rate": 7.849155826183227e-06, + "loss": 0.1006, + "step": 41695 + }, + { + "epoch": 4.08, + "learning_rate": 7.84500415167451e-06, + "loss": 0.0821, + "step": 41700 + }, + { + "epoch": 4.08, + "learning_rate": 7.84085247716579e-06, + "loss": 0.0875, + "step": 41705 + }, + { + "epoch": 4.08, + "learning_rate": 7.836700802657071e-06, + "loss": 0.1031, + "step": 41710 + }, + { + "epoch": 4.08, + "learning_rate": 7.832549128148352e-06, + "loss": 0.0816, + "step": 41715 + }, + { + "epoch": 4.08, + "learning_rate": 7.828397453639635e-06, + "loss": 0.0931, + "step": 41720 + }, + { + "epoch": 4.08, + "learning_rate": 7.824245779130917e-06, + "loss": 0.1166, + "step": 41725 + }, + { + "epoch": 4.08, + "learning_rate": 7.820094104622198e-06, + "loss": 0.0975, + "step": 41730 + }, + { + "epoch": 4.08, + "learning_rate": 7.815942430113479e-06, + "loss": 0.1007, + "step": 41735 + }, + { + "epoch": 4.08, + "learning_rate": 7.81179075560476e-06, + "loss": 0.1102, + "step": 41740 + }, + { + "epoch": 4.08, + "learning_rate": 7.807639081096044e-06, + "loss": 0.1145, + "step": 41745 + }, + { + "epoch": 4.08, + "learning_rate": 7.803487406587324e-06, + "loss": 0.0963, + "step": 41750 + }, + { + "epoch": 4.08, + "learning_rate": 7.799335732078605e-06, + "loss": 0.088, + "step": 41755 + }, + { + "epoch": 4.08, + "learning_rate": 7.795184057569886e-06, + "loss": 0.1113, + "step": 41760 + }, + { + "epoch": 4.08, + "learning_rate": 7.791032383061167e-06, + "loss": 0.1011, + "step": 41765 + }, + { + "epoch": 4.08, + "learning_rate": 7.78688070855245e-06, + "loss": 0.0915, + "step": 41770 + }, + { + "epoch": 4.08, + "learning_rate": 7.782729034043732e-06, + "loss": 0.1001, + "step": 41775 + }, + { + "epoch": 4.09, + "learning_rate": 7.778577359535012e-06, + "loss": 0.0947, + "step": 41780 + }, + { + "epoch": 4.09, + "learning_rate": 7.774425685026293e-06, + "loss": 0.085, + "step": 41785 + }, + { + "epoch": 4.09, + "learning_rate": 7.770274010517576e-06, + "loss": 0.0888, + "step": 41790 + }, + { + "epoch": 4.09, + "learning_rate": 7.766122336008858e-06, + "loss": 0.1037, + "step": 41795 + }, + { + "epoch": 4.09, + "learning_rate": 7.761970661500139e-06, + "loss": 0.0745, + "step": 41800 + }, + { + "epoch": 4.09, + "learning_rate": 7.75781898699142e-06, + "loss": 0.0907, + "step": 41805 + }, + { + "epoch": 4.09, + "learning_rate": 7.753667312482702e-06, + "loss": 0.1019, + "step": 41810 + }, + { + "epoch": 4.09, + "learning_rate": 7.749515637973983e-06, + "loss": 0.0972, + "step": 41815 + }, + { + "epoch": 4.09, + "learning_rate": 7.745363963465265e-06, + "loss": 0.086, + "step": 41820 + }, + { + "epoch": 4.09, + "learning_rate": 7.741212288956546e-06, + "loss": 0.1248, + "step": 41825 + }, + { + "epoch": 4.09, + "learning_rate": 7.737060614447827e-06, + "loss": 0.1085, + "step": 41830 + }, + { + "epoch": 4.09, + "learning_rate": 7.73290893993911e-06, + "loss": 0.0901, + "step": 41835 + }, + { + "epoch": 4.09, + "learning_rate": 7.72875726543039e-06, + "loss": 0.081, + "step": 41840 + }, + { + "epoch": 4.09, + "learning_rate": 7.724605590921673e-06, + "loss": 0.1079, + "step": 41845 + }, + { + "epoch": 4.09, + "learning_rate": 7.720453916412953e-06, + "loss": 0.0984, + "step": 41850 + }, + { + "epoch": 4.09, + "learning_rate": 7.716302241904236e-06, + "loss": 0.0893, + "step": 41855 + }, + { + "epoch": 4.09, + "learning_rate": 7.712150567395517e-06, + "loss": 0.0986, + "step": 41860 + }, + { + "epoch": 4.09, + "learning_rate": 7.707998892886797e-06, + "loss": 0.0865, + "step": 41865 + }, + { + "epoch": 4.09, + "learning_rate": 7.70384721837808e-06, + "loss": 0.092, + "step": 41870 + }, + { + "epoch": 4.09, + "learning_rate": 7.69969554386936e-06, + "loss": 0.0969, + "step": 41875 + }, + { + "epoch": 4.1, + "learning_rate": 7.695543869360643e-06, + "loss": 0.1033, + "step": 41880 + }, + { + "epoch": 4.1, + "learning_rate": 7.691392194851924e-06, + "loss": 0.0854, + "step": 41885 + }, + { + "epoch": 4.1, + "learning_rate": 7.687240520343205e-06, + "loss": 0.0919, + "step": 41890 + }, + { + "epoch": 4.1, + "learning_rate": 7.683088845834487e-06, + "loss": 0.1063, + "step": 41895 + }, + { + "epoch": 4.1, + "learning_rate": 7.67893717132577e-06, + "loss": 0.0899, + "step": 41900 + }, + { + "epoch": 4.1, + "learning_rate": 7.67478549681705e-06, + "loss": 0.0838, + "step": 41905 + }, + { + "epoch": 4.1, + "learning_rate": 7.670633822308331e-06, + "loss": 0.1079, + "step": 41910 + }, + { + "epoch": 4.1, + "learning_rate": 7.666482147799612e-06, + "loss": 0.0879, + "step": 41915 + }, + { + "epoch": 4.1, + "learning_rate": 7.662330473290894e-06, + "loss": 0.0883, + "step": 41920 + }, + { + "epoch": 4.1, + "learning_rate": 7.658178798782177e-06, + "loss": 0.1072, + "step": 41925 + }, + { + "epoch": 4.1, + "learning_rate": 7.654027124273457e-06, + "loss": 0.1057, + "step": 41930 + }, + { + "epoch": 4.1, + "learning_rate": 7.649875449764738e-06, + "loss": 0.085, + "step": 41935 + }, + { + "epoch": 4.1, + "learning_rate": 7.645723775256019e-06, + "loss": 0.093, + "step": 41940 + }, + { + "epoch": 4.1, + "learning_rate": 7.641572100747301e-06, + "loss": 0.0955, + "step": 41945 + }, + { + "epoch": 4.1, + "learning_rate": 7.637420426238584e-06, + "loss": 0.0919, + "step": 41950 + }, + { + "epoch": 4.1, + "learning_rate": 7.633268751729865e-06, + "loss": 0.0938, + "step": 41955 + }, + { + "epoch": 4.1, + "learning_rate": 7.629117077221145e-06, + "loss": 0.1212, + "step": 41960 + }, + { + "epoch": 4.1, + "learning_rate": 7.624965402712428e-06, + "loss": 0.0781, + "step": 41965 + }, + { + "epoch": 4.1, + "learning_rate": 7.6208137282037095e-06, + "loss": 0.0813, + "step": 41970 + }, + { + "epoch": 4.1, + "learning_rate": 7.61666205369499e-06, + "loss": 0.1086, + "step": 41975 + }, + { + "epoch": 4.1, + "learning_rate": 7.612510379186272e-06, + "loss": 0.1036, + "step": 41980 + }, + { + "epoch": 4.11, + "learning_rate": 7.608358704677553e-06, + "loss": 0.0853, + "step": 41985 + }, + { + "epoch": 4.11, + "learning_rate": 7.604207030168835e-06, + "loss": 0.0919, + "step": 41990 + }, + { + "epoch": 4.11, + "learning_rate": 7.600055355660117e-06, + "loss": 0.105, + "step": 41995 + }, + { + "epoch": 4.11, + "learning_rate": 7.5959036811513975e-06, + "loss": 0.0893, + "step": 42000 + }, + { + "epoch": 4.11, + "eval_cer": 0.05474471120606931, + "eval_loss": 0.22598466277122498, + "eval_runtime": 273.8634, + "eval_samples_per_second": 59.774, + "eval_steps_per_second": 1.661, + "eval_wer": 0.14056796588809153, + "step": 42000 + }, + { + "epoch": 4.11, + "learning_rate": 7.591752006642679e-06, + "loss": 0.0967, + "step": 42005 + }, + { + "epoch": 4.11, + "learning_rate": 7.587600332133962e-06, + "loss": 0.095, + "step": 42010 + }, + { + "epoch": 4.11, + "learning_rate": 7.583448657625242e-06, + "loss": 0.0867, + "step": 42015 + }, + { + "epoch": 4.11, + "learning_rate": 7.579296983116524e-06, + "loss": 0.0868, + "step": 42020 + }, + { + "epoch": 4.11, + "learning_rate": 7.575145308607805e-06, + "loss": 0.1038, + "step": 42025 + }, + { + "epoch": 4.11, + "learning_rate": 7.570993634099088e-06, + "loss": 0.0927, + "step": 42030 + }, + { + "epoch": 4.11, + "learning_rate": 7.566841959590369e-06, + "loss": 0.0829, + "step": 42035 + }, + { + "epoch": 4.11, + "learning_rate": 7.5626902850816496e-06, + "loss": 0.0958, + "step": 42040 + }, + { + "epoch": 4.11, + "learning_rate": 7.558538610572931e-06, + "loss": 0.1103, + "step": 42045 + }, + { + "epoch": 4.11, + "learning_rate": 7.554386936064212e-06, + "loss": 0.0864, + "step": 42050 + }, + { + "epoch": 4.11, + "learning_rate": 7.550235261555494e-06, + "loss": 0.0804, + "step": 42055 + }, + { + "epoch": 4.11, + "learning_rate": 7.546083587046776e-06, + "loss": 0.1111, + "step": 42060 + }, + { + "epoch": 4.11, + "learning_rate": 7.5427622474398015e-06, + "loss": 0.088, + "step": 42065 + }, + { + "epoch": 4.11, + "learning_rate": 7.538610572931082e-06, + "loss": 0.0914, + "step": 42070 + }, + { + "epoch": 4.11, + "learning_rate": 7.534458898422363e-06, + "loss": 0.1027, + "step": 42075 + }, + { + "epoch": 4.11, + "learning_rate": 7.530307223913646e-06, + "loss": 0.0784, + "step": 42080 + }, + { + "epoch": 4.12, + "learning_rate": 7.526155549404927e-06, + "loss": 0.1, + "step": 42085 + }, + { + "epoch": 4.12, + "learning_rate": 7.522003874896209e-06, + "loss": 0.098, + "step": 42090 + }, + { + "epoch": 4.12, + "learning_rate": 7.5178522003874895e-06, + "loss": 0.1013, + "step": 42095 + }, + { + "epoch": 4.12, + "learning_rate": 7.51370052587877e-06, + "loss": 0.0832, + "step": 42100 + }, + { + "epoch": 4.12, + "learning_rate": 7.5095488513700536e-06, + "loss": 0.0886, + "step": 42105 + }, + { + "epoch": 4.12, + "learning_rate": 7.505397176861334e-06, + "loss": 0.0979, + "step": 42110 + }, + { + "epoch": 4.12, + "learning_rate": 7.501245502352615e-06, + "loss": 0.085, + "step": 42115 + }, + { + "epoch": 4.12, + "learning_rate": 7.4970938278438976e-06, + "loss": 0.0809, + "step": 42120 + }, + { + "epoch": 4.12, + "learning_rate": 7.492942153335178e-06, + "loss": 0.1062, + "step": 42125 + }, + { + "epoch": 4.12, + "learning_rate": 7.488790478826461e-06, + "loss": 0.1046, + "step": 42130 + }, + { + "epoch": 4.12, + "learning_rate": 7.4846388043177416e-06, + "loss": 0.1015, + "step": 42135 + }, + { + "epoch": 4.12, + "learning_rate": 7.480487129809023e-06, + "loss": 0.0987, + "step": 42140 + }, + { + "epoch": 4.12, + "learning_rate": 7.476335455300305e-06, + "loss": 0.1126, + "step": 42145 + }, + { + "epoch": 4.12, + "learning_rate": 7.4721837807915856e-06, + "loss": 0.0999, + "step": 42150 + }, + { + "epoch": 4.12, + "learning_rate": 7.468032106282868e-06, + "loss": 0.0837, + "step": 42155 + }, + { + "epoch": 4.12, + "learning_rate": 7.463880431774149e-06, + "loss": 0.1169, + "step": 42160 + }, + { + "epoch": 4.12, + "learning_rate": 7.45972875726543e-06, + "loss": 0.0938, + "step": 42165 + }, + { + "epoch": 4.12, + "learning_rate": 7.455577082756712e-06, + "loss": 0.0856, + "step": 42170 + }, + { + "epoch": 4.12, + "learning_rate": 7.451425408247994e-06, + "loss": 0.1065, + "step": 42175 + }, + { + "epoch": 4.12, + "learning_rate": 7.447273733739275e-06, + "loss": 0.0995, + "step": 42180 + }, + { + "epoch": 4.12, + "learning_rate": 7.443122059230557e-06, + "loss": 0.0946, + "step": 42185 + }, + { + "epoch": 4.13, + "learning_rate": 7.438970384721838e-06, + "loss": 0.0949, + "step": 42190 + }, + { + "epoch": 4.13, + "learning_rate": 7.43481871021312e-06, + "loss": 0.1196, + "step": 42195 + }, + { + "epoch": 4.13, + "learning_rate": 7.430667035704401e-06, + "loss": 0.0735, + "step": 42200 + }, + { + "epoch": 4.13, + "learning_rate": 7.4265153611956825e-06, + "loss": 0.0806, + "step": 42205 + }, + { + "epoch": 4.13, + "learning_rate": 7.422363686686964e-06, + "loss": 0.1042, + "step": 42210 + }, + { + "epoch": 4.13, + "learning_rate": 7.418212012178245e-06, + "loss": 0.0886, + "step": 42215 + }, + { + "epoch": 4.13, + "learning_rate": 7.414060337669527e-06, + "loss": 0.0913, + "step": 42220 + }, + { + "epoch": 4.13, + "learning_rate": 7.409908663160808e-06, + "loss": 0.1048, + "step": 42225 + }, + { + "epoch": 4.13, + "learning_rate": 7.40575698865209e-06, + "loss": 0.0923, + "step": 42230 + }, + { + "epoch": 4.13, + "learning_rate": 7.401605314143371e-06, + "loss": 0.0794, + "step": 42235 + }, + { + "epoch": 4.13, + "learning_rate": 7.397453639634653e-06, + "loss": 0.0823, + "step": 42240 + }, + { + "epoch": 4.13, + "learning_rate": 7.3933019651259346e-06, + "loss": 0.1114, + "step": 42245 + }, + { + "epoch": 4.13, + "learning_rate": 7.389150290617216e-06, + "loss": 0.0947, + "step": 42250 + }, + { + "epoch": 4.13, + "learning_rate": 7.384998616108497e-06, + "loss": 0.0929, + "step": 42255 + }, + { + "epoch": 4.13, + "learning_rate": 7.3808469415997786e-06, + "loss": 0.1075, + "step": 42260 + }, + { + "epoch": 4.13, + "learning_rate": 7.37669526709106e-06, + "loss": 0.0739, + "step": 42265 + }, + { + "epoch": 4.13, + "learning_rate": 7.372543592582342e-06, + "loss": 0.0858, + "step": 42270 + }, + { + "epoch": 4.13, + "learning_rate": 7.368391918073623e-06, + "loss": 0.0898, + "step": 42275 + }, + { + "epoch": 4.13, + "learning_rate": 7.364240243564904e-06, + "loss": 0.0992, + "step": 42280 + }, + { + "epoch": 4.13, + "learning_rate": 7.360088569056187e-06, + "loss": 0.0852, + "step": 42285 + }, + { + "epoch": 4.14, + "learning_rate": 7.355936894547467e-06, + "loss": 0.0909, + "step": 42290 + }, + { + "epoch": 4.14, + "learning_rate": 7.35178522003875e-06, + "loss": 0.127, + "step": 42295 + }, + { + "epoch": 4.14, + "learning_rate": 7.347633545530031e-06, + "loss": 0.1033, + "step": 42300 + }, + { + "epoch": 4.14, + "learning_rate": 7.343481871021312e-06, + "loss": 0.0952, + "step": 42305 + }, + { + "epoch": 4.14, + "learning_rate": 7.339330196512594e-06, + "loss": 0.1068, + "step": 42310 + }, + { + "epoch": 4.14, + "learning_rate": 7.335178522003875e-06, + "loss": 0.087, + "step": 42315 + }, + { + "epoch": 4.14, + "learning_rate": 7.331026847495156e-06, + "loss": 0.0819, + "step": 42320 + }, + { + "epoch": 4.14, + "learning_rate": 7.326875172986438e-06, + "loss": 0.1144, + "step": 42325 + }, + { + "epoch": 4.14, + "learning_rate": 7.3227234984777195e-06, + "loss": 0.0851, + "step": 42330 + }, + { + "epoch": 4.14, + "learning_rate": 7.318571823969001e-06, + "loss": 0.0791, + "step": 42335 + }, + { + "epoch": 4.14, + "learning_rate": 7.314420149460283e-06, + "loss": 0.0813, + "step": 42340 + }, + { + "epoch": 4.14, + "learning_rate": 7.3102684749515635e-06, + "loss": 0.0932, + "step": 42345 + }, + { + "epoch": 4.14, + "learning_rate": 7.306116800442846e-06, + "loss": 0.0828, + "step": 42350 + }, + { + "epoch": 4.14, + "learning_rate": 7.301965125934127e-06, + "loss": 0.0805, + "step": 42355 + }, + { + "epoch": 4.14, + "learning_rate": 7.297813451425409e-06, + "loss": 0.1007, + "step": 42360 + }, + { + "epoch": 4.14, + "learning_rate": 7.29366177691669e-06, + "loss": 0.0902, + "step": 42365 + }, + { + "epoch": 4.14, + "learning_rate": 7.289510102407971e-06, + "loss": 0.0866, + "step": 42370 + }, + { + "epoch": 4.14, + "learning_rate": 7.285358427899253e-06, + "loss": 0.106, + "step": 42375 + }, + { + "epoch": 4.14, + "learning_rate": 7.281206753390534e-06, + "loss": 0.0908, + "step": 42380 + }, + { + "epoch": 4.14, + "learning_rate": 7.277055078881816e-06, + "loss": 0.0862, + "step": 42385 + }, + { + "epoch": 4.15, + "learning_rate": 7.272903404373097e-06, + "loss": 0.0893, + "step": 42390 + }, + { + "epoch": 4.15, + "learning_rate": 7.268751729864379e-06, + "loss": 0.1154, + "step": 42395 + }, + { + "epoch": 4.15, + "learning_rate": 7.26460005535566e-06, + "loss": 0.0889, + "step": 42400 + }, + { + "epoch": 4.15, + "learning_rate": 7.260448380846942e-06, + "loss": 0.0895, + "step": 42405 + }, + { + "epoch": 4.15, + "learning_rate": 7.256296706338224e-06, + "loss": 0.1167, + "step": 42410 + }, + { + "epoch": 4.15, + "learning_rate": 7.252145031829504e-06, + "loss": 0.0821, + "step": 42415 + }, + { + "epoch": 4.15, + "learning_rate": 7.247993357320786e-06, + "loss": 0.0846, + "step": 42420 + }, + { + "epoch": 4.15, + "learning_rate": 7.243841682812068e-06, + "loss": 0.1066, + "step": 42425 + }, + { + "epoch": 4.15, + "learning_rate": 7.239690008303349e-06, + "loss": 0.0958, + "step": 42430 + }, + { + "epoch": 4.15, + "learning_rate": 7.23553833379463e-06, + "loss": 0.0922, + "step": 42435 + }, + { + "epoch": 4.15, + "learning_rate": 7.2313866592859125e-06, + "loss": 0.0747, + "step": 42440 + }, + { + "epoch": 4.15, + "learning_rate": 7.227234984777193e-06, + "loss": 0.1088, + "step": 42445 + }, + { + "epoch": 4.15, + "learning_rate": 7.223083310268476e-06, + "loss": 0.0904, + "step": 42450 + }, + { + "epoch": 4.15, + "learning_rate": 7.2189316357597565e-06, + "loss": 0.0885, + "step": 42455 + }, + { + "epoch": 4.15, + "learning_rate": 7.214779961251038e-06, + "loss": 0.0975, + "step": 42460 + }, + { + "epoch": 4.15, + "learning_rate": 7.21062828674232e-06, + "loss": 0.1032, + "step": 42465 + }, + { + "epoch": 4.15, + "learning_rate": 7.2064766122336005e-06, + "loss": 0.0879, + "step": 42470 + }, + { + "epoch": 4.15, + "learning_rate": 7.202324937724883e-06, + "loss": 0.1058, + "step": 42475 + }, + { + "epoch": 4.15, + "learning_rate": 7.198173263216164e-06, + "loss": 0.099, + "step": 42480 + }, + { + "epoch": 4.15, + "learning_rate": 7.194021588707445e-06, + "loss": 0.0793, + "step": 42485 + }, + { + "epoch": 4.15, + "learning_rate": 7.189869914198727e-06, + "loss": 0.0856, + "step": 42490 + }, + { + "epoch": 4.16, + "learning_rate": 7.1857182396900086e-06, + "loss": 0.103, + "step": 42495 + }, + { + "epoch": 4.16, + "learning_rate": 7.18156656518129e-06, + "loss": 0.0892, + "step": 42500 + }, + { + "epoch": 4.16, + "eval_cer": 0.054352777411664596, + "eval_loss": 0.22715312242507935, + "eval_runtime": 325.4426, + "eval_samples_per_second": 50.301, + "eval_steps_per_second": 1.398, + "eval_wer": 0.1391052806853725, + "step": 42500 + }, + { + "epoch": 4.16, + "learning_rate": 7.177414890672572e-06, + "loss": 0.0808, + "step": 42505 + }, + { + "epoch": 4.16, + "learning_rate": 7.1732632161638526e-06, + "loss": 0.109, + "step": 42510 + }, + { + "epoch": 4.16, + "learning_rate": 7.169111541655135e-06, + "loss": 0.0898, + "step": 42515 + }, + { + "epoch": 4.16, + "learning_rate": 7.164959867146416e-06, + "loss": 0.0828, + "step": 42520 + }, + { + "epoch": 4.16, + "learning_rate": 7.1608081926376966e-06, + "loss": 0.105, + "step": 42525 + }, + { + "epoch": 4.16, + "learning_rate": 7.156656518128979e-06, + "loss": 0.1015, + "step": 42530 + }, + { + "epoch": 4.16, + "learning_rate": 7.15250484362026e-06, + "loss": 0.078, + "step": 42535 + }, + { + "epoch": 4.16, + "learning_rate": 7.148353169111542e-06, + "loss": 0.0855, + "step": 42540 + }, + { + "epoch": 4.16, + "learning_rate": 7.144201494602823e-06, + "loss": 0.0949, + "step": 42545 + }, + { + "epoch": 4.16, + "learning_rate": 7.140049820094105e-06, + "loss": 0.081, + "step": 42550 + }, + { + "epoch": 4.16, + "learning_rate": 7.135898145585386e-06, + "loss": 0.0866, + "step": 42555 + }, + { + "epoch": 4.16, + "learning_rate": 7.131746471076668e-06, + "loss": 0.1048, + "step": 42560 + }, + { + "epoch": 4.16, + "learning_rate": 7.1275947965679495e-06, + "loss": 0.0901, + "step": 42565 + }, + { + "epoch": 4.16, + "learning_rate": 7.123443122059231e-06, + "loss": 0.0938, + "step": 42570 + }, + { + "epoch": 4.16, + "learning_rate": 7.119291447550512e-06, + "loss": 0.0907, + "step": 42575 + }, + { + "epoch": 4.16, + "learning_rate": 7.1151397730417935e-06, + "loss": 0.0945, + "step": 42580 + }, + { + "epoch": 4.16, + "learning_rate": 7.110988098533075e-06, + "loss": 0.0907, + "step": 42585 + }, + { + "epoch": 4.16, + "learning_rate": 7.106836424024357e-06, + "loss": 0.082, + "step": 42590 + }, + { + "epoch": 4.17, + "learning_rate": 7.102684749515638e-06, + "loss": 0.1162, + "step": 42595 + }, + { + "epoch": 4.17, + "learning_rate": 7.098533075006919e-06, + "loss": 0.0815, + "step": 42600 + }, + { + "epoch": 4.17, + "learning_rate": 7.0943814004982016e-06, + "loss": 0.0891, + "step": 42605 + }, + { + "epoch": 4.17, + "learning_rate": 7.090229725989482e-06, + "loss": 0.101, + "step": 42610 + }, + { + "epoch": 4.17, + "learning_rate": 7.086078051480765e-06, + "loss": 0.0947, + "step": 42615 + }, + { + "epoch": 4.17, + "learning_rate": 7.0819263769720456e-06, + "loss": 0.0823, + "step": 42620 + }, + { + "epoch": 4.17, + "learning_rate": 7.077774702463327e-06, + "loss": 0.0983, + "step": 42625 + }, + { + "epoch": 4.17, + "learning_rate": 7.073623027954609e-06, + "loss": 0.0908, + "step": 42630 + }, + { + "epoch": 4.17, + "learning_rate": 7.0694713534458896e-06, + "loss": 0.0741, + "step": 42635 + }, + { + "epoch": 4.17, + "learning_rate": 7.065319678937171e-06, + "loss": 0.0975, + "step": 42640 + }, + { + "epoch": 4.17, + "learning_rate": 7.061168004428453e-06, + "loss": 0.1115, + "step": 42645 + }, + { + "epoch": 4.17, + "learning_rate": 7.057016329919734e-06, + "loss": 0.0837, + "step": 42650 + }, + { + "epoch": 4.17, + "learning_rate": 7.052864655411016e-06, + "loss": 0.0928, + "step": 42655 + }, + { + "epoch": 4.17, + "learning_rate": 7.048712980902298e-06, + "loss": 0.1051, + "step": 42660 + }, + { + "epoch": 4.17, + "learning_rate": 7.044561306393578e-06, + "loss": 0.0983, + "step": 42665 + }, + { + "epoch": 4.17, + "learning_rate": 7.040409631884861e-06, + "loss": 0.0885, + "step": 42670 + }, + { + "epoch": 4.17, + "learning_rate": 7.036257957376142e-06, + "loss": 0.102, + "step": 42675 + }, + { + "epoch": 4.17, + "learning_rate": 7.032106282867424e-06, + "loss": 0.0875, + "step": 42680 + }, + { + "epoch": 4.17, + "learning_rate": 7.027954608358705e-06, + "loss": 0.0705, + "step": 42685 + }, + { + "epoch": 4.17, + "learning_rate": 7.023802933849986e-06, + "loss": 0.0902, + "step": 42690 + }, + { + "epoch": 4.17, + "learning_rate": 7.019651259341268e-06, + "loss": 0.1088, + "step": 42695 + }, + { + "epoch": 4.18, + "learning_rate": 7.015499584832549e-06, + "loss": 0.0844, + "step": 42700 + }, + { + "epoch": 4.18, + "learning_rate": 7.011347910323831e-06, + "loss": 0.0899, + "step": 42705 + }, + { + "epoch": 4.18, + "learning_rate": 7.007196235815112e-06, + "loss": 0.1076, + "step": 42710 + }, + { + "epoch": 4.18, + "learning_rate": 7.003044561306394e-06, + "loss": 0.0903, + "step": 42715 + }, + { + "epoch": 4.18, + "learning_rate": 6.998892886797675e-06, + "loss": 0.0809, + "step": 42720 + }, + { + "epoch": 4.18, + "learning_rate": 6.994741212288957e-06, + "loss": 0.1046, + "step": 42725 + }, + { + "epoch": 4.18, + "learning_rate": 6.990589537780238e-06, + "loss": 0.0895, + "step": 42730 + }, + { + "epoch": 4.18, + "learning_rate": 6.98643786327152e-06, + "loss": 0.0905, + "step": 42735 + }, + { + "epoch": 4.18, + "learning_rate": 6.982286188762801e-06, + "loss": 0.1066, + "step": 42740 + }, + { + "epoch": 4.18, + "learning_rate": 6.9781345142540826e-06, + "loss": 0.107, + "step": 42745 + }, + { + "epoch": 4.18, + "learning_rate": 6.973982839745364e-06, + "loss": 0.1062, + "step": 42750 + }, + { + "epoch": 4.18, + "learning_rate": 6.969831165236645e-06, + "loss": 0.0876, + "step": 42755 + }, + { + "epoch": 4.18, + "learning_rate": 6.965679490727927e-06, + "loss": 0.1025, + "step": 42760 + }, + { + "epoch": 4.18, + "learning_rate": 6.961527816219208e-06, + "loss": 0.0874, + "step": 42765 + }, + { + "epoch": 4.18, + "learning_rate": 6.957376141710491e-06, + "loss": 0.0844, + "step": 42770 + }, + { + "epoch": 4.18, + "learning_rate": 6.953224467201771e-06, + "loss": 0.0929, + "step": 42775 + }, + { + "epoch": 4.18, + "learning_rate": 6.949072792693053e-06, + "loss": 0.0953, + "step": 42780 + }, + { + "epoch": 4.18, + "learning_rate": 6.944921118184335e-06, + "loss": 0.0709, + "step": 42785 + }, + { + "epoch": 4.18, + "learning_rate": 6.940769443675616e-06, + "loss": 0.0865, + "step": 42790 + }, + { + "epoch": 4.18, + "learning_rate": 6.936617769166898e-06, + "loss": 0.1152, + "step": 42795 + }, + { + "epoch": 4.19, + "learning_rate": 6.932466094658179e-06, + "loss": 0.0947, + "step": 42800 + }, + { + "epoch": 4.19, + "learning_rate": 6.92831442014946e-06, + "loss": 0.0946, + "step": 42805 + }, + { + "epoch": 4.19, + "learning_rate": 6.924162745640742e-06, + "loss": 0.1169, + "step": 42810 + }, + { + "epoch": 4.19, + "learning_rate": 6.9200110711320235e-06, + "loss": 0.0927, + "step": 42815 + }, + { + "epoch": 4.19, + "learning_rate": 6.915859396623305e-06, + "loss": 0.0848, + "step": 42820 + }, + { + "epoch": 4.19, + "learning_rate": 6.911707722114587e-06, + "loss": 0.0986, + "step": 42825 + }, + { + "epoch": 4.19, + "learning_rate": 6.9075560476058675e-06, + "loss": 0.103, + "step": 42830 + }, + { + "epoch": 4.19, + "learning_rate": 6.90340437309715e-06, + "loss": 0.0887, + "step": 42835 + }, + { + "epoch": 4.19, + "learning_rate": 6.899252698588431e-06, + "loss": 0.0918, + "step": 42840 + }, + { + "epoch": 4.19, + "learning_rate": 6.895101024079712e-06, + "loss": 0.1054, + "step": 42845 + }, + { + "epoch": 4.19, + "learning_rate": 6.890949349570994e-06, + "loss": 0.0863, + "step": 42850 + }, + { + "epoch": 4.19, + "learning_rate": 6.886797675062275e-06, + "loss": 0.0825, + "step": 42855 + }, + { + "epoch": 4.19, + "learning_rate": 6.882646000553557e-06, + "loss": 0.0925, + "step": 42860 + }, + { + "epoch": 4.19, + "learning_rate": 6.878494326044838e-06, + "loss": 0.0898, + "step": 42865 + }, + { + "epoch": 4.19, + "learning_rate": 6.8743426515361196e-06, + "loss": 0.0886, + "step": 42870 + }, + { + "epoch": 4.19, + "learning_rate": 6.870190977027401e-06, + "loss": 0.0925, + "step": 42875 + }, + { + "epoch": 4.19, + "learning_rate": 6.866039302518683e-06, + "loss": 0.0868, + "step": 42880 + }, + { + "epoch": 4.19, + "learning_rate": 6.861887628009964e-06, + "loss": 0.0859, + "step": 42885 + }, + { + "epoch": 4.19, + "learning_rate": 6.857735953501246e-06, + "loss": 0.0821, + "step": 42890 + }, + { + "epoch": 4.19, + "learning_rate": 6.853584278992527e-06, + "loss": 0.1206, + "step": 42895 + }, + { + "epoch": 4.19, + "learning_rate": 6.849432604483809e-06, + "loss": 0.0916, + "step": 42900 + }, + { + "epoch": 4.2, + "learning_rate": 6.84528092997509e-06, + "loss": 0.0666, + "step": 42905 + }, + { + "epoch": 4.2, + "learning_rate": 6.841129255466372e-06, + "loss": 0.1187, + "step": 42910 + }, + { + "epoch": 4.2, + "learning_rate": 6.836977580957653e-06, + "loss": 0.0847, + "step": 42915 + }, + { + "epoch": 4.2, + "learning_rate": 6.832825906448934e-06, + "loss": 0.0747, + "step": 42920 + }, + { + "epoch": 4.2, + "learning_rate": 6.8286742319402165e-06, + "loss": 0.0987, + "step": 42925 + }, + { + "epoch": 4.2, + "learning_rate": 6.824522557431497e-06, + "loss": 0.1092, + "step": 42930 + }, + { + "epoch": 4.2, + "learning_rate": 6.820370882922779e-06, + "loss": 0.0905, + "step": 42935 + }, + { + "epoch": 4.2, + "learning_rate": 6.8162192084140605e-06, + "loss": 0.0942, + "step": 42940 + }, + { + "epoch": 4.2, + "learning_rate": 6.812067533905342e-06, + "loss": 0.0982, + "step": 42945 + }, + { + "epoch": 4.2, + "learning_rate": 6.807915859396624e-06, + "loss": 0.0795, + "step": 42950 + }, + { + "epoch": 4.2, + "learning_rate": 6.803764184887905e-06, + "loss": 0.0912, + "step": 42955 + }, + { + "epoch": 4.2, + "learning_rate": 6.799612510379186e-06, + "loss": 0.1256, + "step": 42960 + }, + { + "epoch": 4.2, + "learning_rate": 6.795460835870468e-06, + "loss": 0.0849, + "step": 42965 + }, + { + "epoch": 4.2, + "learning_rate": 6.791309161361749e-06, + "loss": 0.0831, + "step": 42970 + }, + { + "epoch": 4.2, + "learning_rate": 6.787157486853031e-06, + "loss": 0.0889, + "step": 42975 + }, + { + "epoch": 4.2, + "learning_rate": 6.7830058123443126e-06, + "loss": 0.108, + "step": 42980 + }, + { + "epoch": 4.2, + "learning_rate": 6.778854137835593e-06, + "loss": 0.0877, + "step": 42985 + }, + { + "epoch": 4.2, + "learning_rate": 6.774702463326876e-06, + "loss": 0.0792, + "step": 42990 + }, + { + "epoch": 4.2, + "learning_rate": 6.7705507888181566e-06, + "loss": 0.1056, + "step": 42995 + }, + { + "epoch": 4.2, + "learning_rate": 6.766399114309439e-06, + "loss": 0.0761, + "step": 43000 + }, + { + "epoch": 4.2, + "eval_cer": 0.05470308991816792, + "eval_loss": 0.2300744205713272, + "eval_runtime": 282.9313, + "eval_samples_per_second": 57.859, + "eval_steps_per_second": 1.608, + "eval_wer": 0.13961460856846217, + "step": 43000 + }, + { + "epoch": 4.21, + "learning_rate": 6.76224743980072e-06, + "loss": 0.0806, + "step": 43005 + }, + { + "epoch": 4.21, + "learning_rate": 6.758095765292001e-06, + "loss": 0.1033, + "step": 43010 + }, + { + "epoch": 4.21, + "learning_rate": 6.753944090783283e-06, + "loss": 0.0889, + "step": 43015 + }, + { + "epoch": 4.21, + "learning_rate": 6.749792416274564e-06, + "loss": 0.0739, + "step": 43020 + }, + { + "epoch": 4.21, + "learning_rate": 6.745640741765846e-06, + "loss": 0.1175, + "step": 43025 + }, + { + "epoch": 4.21, + "learning_rate": 6.741489067257127e-06, + "loss": 0.0938, + "step": 43030 + }, + { + "epoch": 4.21, + "learning_rate": 6.737337392748409e-06, + "loss": 0.0872, + "step": 43035 + }, + { + "epoch": 4.21, + "learning_rate": 6.73318571823969e-06, + "loss": 0.0769, + "step": 43040 + }, + { + "epoch": 4.21, + "learning_rate": 6.729034043730972e-06, + "loss": 0.1149, + "step": 43045 + }, + { + "epoch": 4.21, + "learning_rate": 6.724882369222253e-06, + "loss": 0.0866, + "step": 43050 + }, + { + "epoch": 4.21, + "learning_rate": 6.720730694713535e-06, + "loss": 0.0811, + "step": 43055 + }, + { + "epoch": 4.21, + "learning_rate": 6.716579020204816e-06, + "loss": 0.1252, + "step": 43060 + }, + { + "epoch": 4.21, + "learning_rate": 6.712427345696098e-06, + "loss": 0.0999, + "step": 43065 + }, + { + "epoch": 4.21, + "learning_rate": 6.708275671187379e-06, + "loss": 0.0744, + "step": 43070 + }, + { + "epoch": 4.21, + "learning_rate": 6.70412399667866e-06, + "loss": 0.0949, + "step": 43075 + }, + { + "epoch": 4.21, + "learning_rate": 6.699972322169942e-06, + "loss": 0.1107, + "step": 43080 + }, + { + "epoch": 4.21, + "learning_rate": 6.695820647661223e-06, + "loss": 0.0864, + "step": 43085 + }, + { + "epoch": 4.21, + "learning_rate": 6.6916689731525056e-06, + "loss": 0.0761, + "step": 43090 + }, + { + "epoch": 4.21, + "learning_rate": 6.687517298643786e-06, + "loss": 0.0997, + "step": 43095 + }, + { + "epoch": 4.21, + "learning_rate": 6.683365624135068e-06, + "loss": 0.0879, + "step": 43100 + }, + { + "epoch": 4.21, + "learning_rate": 6.6792139496263496e-06, + "loss": 0.0919, + "step": 43105 + }, + { + "epoch": 4.22, + "learning_rate": 6.675062275117631e-06, + "loss": 0.1082, + "step": 43110 + }, + { + "epoch": 4.22, + "learning_rate": 6.670910600608913e-06, + "loss": 0.0858, + "step": 43115 + }, + { + "epoch": 4.22, + "learning_rate": 6.666758926100194e-06, + "loss": 0.087, + "step": 43120 + }, + { + "epoch": 4.22, + "learning_rate": 6.662607251591475e-06, + "loss": 0.1026, + "step": 43125 + }, + { + "epoch": 4.22, + "learning_rate": 6.658455577082757e-06, + "loss": 0.0965, + "step": 43130 + }, + { + "epoch": 4.22, + "learning_rate": 6.654303902574038e-06, + "loss": 0.0875, + "step": 43135 + }, + { + "epoch": 4.22, + "learning_rate": 6.650152228065319e-06, + "loss": 0.0993, + "step": 43140 + }, + { + "epoch": 4.22, + "learning_rate": 6.646000553556602e-06, + "loss": 0.1157, + "step": 43145 + }, + { + "epoch": 4.22, + "learning_rate": 6.641848879047882e-06, + "loss": 0.0829, + "step": 43150 + }, + { + "epoch": 4.22, + "learning_rate": 6.637697204539165e-06, + "loss": 0.0881, + "step": 43155 + }, + { + "epoch": 4.22, + "learning_rate": 6.633545530030446e-06, + "loss": 0.1019, + "step": 43160 + }, + { + "epoch": 4.22, + "learning_rate": 6.629393855521727e-06, + "loss": 0.0926, + "step": 43165 + }, + { + "epoch": 4.22, + "learning_rate": 6.625242181013009e-06, + "loss": 0.083, + "step": 43170 + }, + { + "epoch": 4.22, + "learning_rate": 6.62109050650429e-06, + "loss": 0.1109, + "step": 43175 + }, + { + "epoch": 4.22, + "learning_rate": 6.616938831995572e-06, + "loss": 0.1061, + "step": 43180 + }, + { + "epoch": 4.22, + "learning_rate": 6.612787157486853e-06, + "loss": 0.0966, + "step": 43185 + }, + { + "epoch": 4.22, + "learning_rate": 6.6086354829781345e-06, + "loss": 0.0893, + "step": 43190 + }, + { + "epoch": 4.22, + "learning_rate": 6.604483808469416e-06, + "loss": 0.1054, + "step": 43195 + }, + { + "epoch": 4.22, + "learning_rate": 6.600332133960698e-06, + "loss": 0.0734, + "step": 43200 + }, + { + "epoch": 4.22, + "learning_rate": 6.596180459451979e-06, + "loss": 0.0894, + "step": 43205 + }, + { + "epoch": 4.23, + "learning_rate": 6.592028784943261e-06, + "loss": 0.0872, + "step": 43210 + }, + { + "epoch": 4.23, + "learning_rate": 6.587877110434542e-06, + "loss": 0.0829, + "step": 43215 + }, + { + "epoch": 4.23, + "learning_rate": 6.583725435925824e-06, + "loss": 0.0895, + "step": 43220 + }, + { + "epoch": 4.23, + "learning_rate": 6.579573761417105e-06, + "loss": 0.1109, + "step": 43225 + }, + { + "epoch": 4.23, + "learning_rate": 6.5754220869083866e-06, + "loss": 0.0973, + "step": 43230 + }, + { + "epoch": 4.23, + "learning_rate": 6.571270412399668e-06, + "loss": 0.0879, + "step": 43235 + }, + { + "epoch": 4.23, + "learning_rate": 6.567118737890949e-06, + "loss": 0.0877, + "step": 43240 + }, + { + "epoch": 4.23, + "learning_rate": 6.562967063382231e-06, + "loss": 0.1004, + "step": 43245 + }, + { + "epoch": 4.23, + "learning_rate": 6.558815388873512e-06, + "loss": 0.0821, + "step": 43250 + }, + { + "epoch": 4.23, + "learning_rate": 6.554663714364794e-06, + "loss": 0.0967, + "step": 43255 + }, + { + "epoch": 4.23, + "learning_rate": 6.550512039856075e-06, + "loss": 0.1032, + "step": 43260 + }, + { + "epoch": 4.23, + "learning_rate": 6.546360365347357e-06, + "loss": 0.0849, + "step": 43265 + }, + { + "epoch": 4.23, + "learning_rate": 6.542208690838639e-06, + "loss": 0.0768, + "step": 43270 + }, + { + "epoch": 4.23, + "learning_rate": 6.53805701632992e-06, + "loss": 0.1074, + "step": 43275 + }, + { + "epoch": 4.23, + "learning_rate": 6.533905341821201e-06, + "loss": 0.0954, + "step": 43280 + }, + { + "epoch": 4.23, + "learning_rate": 6.529753667312483e-06, + "loss": 0.0826, + "step": 43285 + }, + { + "epoch": 4.23, + "learning_rate": 6.525601992803764e-06, + "loss": 0.0944, + "step": 43290 + }, + { + "epoch": 4.23, + "learning_rate": 6.521450318295046e-06, + "loss": 0.1114, + "step": 43295 + }, + { + "epoch": 4.23, + "learning_rate": 6.5172986437863275e-06, + "loss": 0.0806, + "step": 43300 + }, + { + "epoch": 4.23, + "learning_rate": 6.513146969277608e-06, + "loss": 0.0815, + "step": 43305 + }, + { + "epoch": 4.24, + "learning_rate": 6.508995294768891e-06, + "loss": 0.1148, + "step": 43310 + }, + { + "epoch": 4.24, + "learning_rate": 6.5048436202601715e-06, + "loss": 0.0899, + "step": 43315 + }, + { + "epoch": 4.24, + "learning_rate": 6.500691945751454e-06, + "loss": 0.0876, + "step": 43320 + }, + { + "epoch": 4.24, + "learning_rate": 6.496540271242735e-06, + "loss": 0.103, + "step": 43325 + }, + { + "epoch": 4.24, + "learning_rate": 6.492388596734016e-06, + "loss": 0.1028, + "step": 43330 + }, + { + "epoch": 4.24, + "learning_rate": 6.488236922225298e-06, + "loss": 0.079, + "step": 43335 + }, + { + "epoch": 4.24, + "learning_rate": 6.484085247716579e-06, + "loss": 0.101, + "step": 43340 + }, + { + "epoch": 4.24, + "learning_rate": 6.47993357320786e-06, + "loss": 0.1068, + "step": 43345 + }, + { + "epoch": 4.24, + "learning_rate": 6.475781898699142e-06, + "loss": 0.0919, + "step": 43350 + }, + { + "epoch": 4.24, + "learning_rate": 6.4716302241904235e-06, + "loss": 0.0768, + "step": 43355 + }, + { + "epoch": 4.24, + "learning_rate": 6.467478549681705e-06, + "loss": 0.1141, + "step": 43360 + }, + { + "epoch": 4.24, + "learning_rate": 6.463326875172987e-06, + "loss": 0.1059, + "step": 43365 + }, + { + "epoch": 4.24, + "learning_rate": 6.4591752006642675e-06, + "loss": 0.0737, + "step": 43370 + }, + { + "epoch": 4.24, + "learning_rate": 6.45502352615555e-06, + "loss": 0.1111, + "step": 43375 + }, + { + "epoch": 4.24, + "learning_rate": 6.450871851646831e-06, + "loss": 0.0877, + "step": 43380 + }, + { + "epoch": 4.24, + "learning_rate": 6.446720177138113e-06, + "loss": 0.0911, + "step": 43385 + }, + { + "epoch": 4.24, + "learning_rate": 6.442568502629394e-06, + "loss": 0.0808, + "step": 43390 + }, + { + "epoch": 4.24, + "learning_rate": 6.438416828120675e-06, + "loss": 0.1126, + "step": 43395 + }, + { + "epoch": 4.24, + "learning_rate": 6.434265153611957e-06, + "loss": 0.0951, + "step": 43400 + }, + { + "epoch": 4.24, + "learning_rate": 6.430113479103238e-06, + "loss": 0.0743, + "step": 43405 + }, + { + "epoch": 4.24, + "learning_rate": 6.4259618045945205e-06, + "loss": 0.1105, + "step": 43410 + }, + { + "epoch": 4.25, + "learning_rate": 6.421810130085801e-06, + "loss": 0.0884, + "step": 43415 + }, + { + "epoch": 4.25, + "learning_rate": 6.417658455577083e-06, + "loss": 0.0935, + "step": 43420 + }, + { + "epoch": 4.25, + "learning_rate": 6.4135067810683645e-06, + "loss": 0.0995, + "step": 43425 + }, + { + "epoch": 4.25, + "learning_rate": 6.409355106559646e-06, + "loss": 0.0964, + "step": 43430 + }, + { + "epoch": 4.25, + "learning_rate": 6.405203432050928e-06, + "loss": 0.0748, + "step": 43435 + }, + { + "epoch": 4.25, + "learning_rate": 6.401051757542209e-06, + "loss": 0.0955, + "step": 43440 + }, + { + "epoch": 4.25, + "learning_rate": 6.39690008303349e-06, + "loss": 0.097, + "step": 43445 + }, + { + "epoch": 4.25, + "learning_rate": 6.392748408524772e-06, + "loss": 0.0895, + "step": 43450 + }, + { + "epoch": 4.25, + "learning_rate": 6.388596734016053e-06, + "loss": 0.0838, + "step": 43455 + }, + { + "epoch": 4.25, + "learning_rate": 6.384445059507334e-06, + "loss": 0.1212, + "step": 43460 + }, + { + "epoch": 4.25, + "learning_rate": 6.3802933849986165e-06, + "loss": 0.0917, + "step": 43465 + }, + { + "epoch": 4.25, + "learning_rate": 6.376141710489897e-06, + "loss": 0.0897, + "step": 43470 + }, + { + "epoch": 4.25, + "learning_rate": 6.37199003598118e-06, + "loss": 0.0955, + "step": 43475 + }, + { + "epoch": 4.25, + "learning_rate": 6.3678383614724605e-06, + "loss": 0.0951, + "step": 43480 + }, + { + "epoch": 4.25, + "learning_rate": 6.363686686963742e-06, + "loss": 0.0869, + "step": 43485 + }, + { + "epoch": 4.25, + "learning_rate": 6.359535012455024e-06, + "loss": 0.0828, + "step": 43490 + }, + { + "epoch": 4.25, + "learning_rate": 6.355383337946305e-06, + "loss": 0.0929, + "step": 43495 + }, + { + "epoch": 4.25, + "learning_rate": 6.351231663437587e-06, + "loss": 0.0931, + "step": 43500 + }, + { + "epoch": 4.25, + "eval_cer": 0.053844072781758776, + "eval_loss": 0.22590665519237518, + "eval_runtime": 279.6258, + "eval_samples_per_second": 58.543, + "eval_steps_per_second": 1.627, + "eval_wer": 0.13765565517196346, + "step": 43500 + }, + { + "epoch": 4.25, + "learning_rate": 6.347079988928868e-06, + "loss": 0.0841, + "step": 43505 + }, + { + "epoch": 4.25, + "learning_rate": 6.342928314420149e-06, + "loss": 0.1102, + "step": 43510 + }, + { + "epoch": 4.26, + "learning_rate": 6.338776639911431e-06, + "loss": 0.0825, + "step": 43515 + }, + { + "epoch": 4.26, + "learning_rate": 6.334624965402713e-06, + "loss": 0.0822, + "step": 43520 + }, + { + "epoch": 4.26, + "learning_rate": 6.330473290893994e-06, + "loss": 0.1155, + "step": 43525 + }, + { + "epoch": 4.26, + "learning_rate": 6.326321616385276e-06, + "loss": 0.0825, + "step": 43530 + }, + { + "epoch": 4.26, + "learning_rate": 6.322169941876557e-06, + "loss": 0.0947, + "step": 43535 + }, + { + "epoch": 4.26, + "learning_rate": 6.318018267367839e-06, + "loss": 0.1014, + "step": 43540 + }, + { + "epoch": 4.26, + "learning_rate": 6.31386659285912e-06, + "loss": 0.1063, + "step": 43545 + }, + { + "epoch": 4.26, + "learning_rate": 6.3097149183504015e-06, + "loss": 0.0987, + "step": 43550 + }, + { + "epoch": 4.26, + "learning_rate": 6.305563243841683e-06, + "loss": 0.0883, + "step": 43555 + }, + { + "epoch": 4.26, + "learning_rate": 6.301411569332964e-06, + "loss": 0.0926, + "step": 43560 + }, + { + "epoch": 4.26, + "learning_rate": 6.297259894824246e-06, + "loss": 0.0815, + "step": 43565 + }, + { + "epoch": 4.26, + "learning_rate": 6.293108220315527e-06, + "loss": 0.0685, + "step": 43570 + }, + { + "epoch": 4.26, + "learning_rate": 6.288956545806809e-06, + "loss": 0.0919, + "step": 43575 + }, + { + "epoch": 4.26, + "learning_rate": 6.28480487129809e-06, + "loss": 0.096, + "step": 43580 + }, + { + "epoch": 4.26, + "learning_rate": 6.280653196789372e-06, + "loss": 0.0771, + "step": 43585 + }, + { + "epoch": 4.26, + "learning_rate": 6.2765015222806535e-06, + "loss": 0.0926, + "step": 43590 + }, + { + "epoch": 4.26, + "learning_rate": 6.272349847771935e-06, + "loss": 0.1, + "step": 43595 + }, + { + "epoch": 4.26, + "learning_rate": 6.268198173263216e-06, + "loss": 0.0865, + "step": 43600 + }, + { + "epoch": 4.26, + "learning_rate": 6.264046498754498e-06, + "loss": 0.0877, + "step": 43605 + }, + { + "epoch": 4.26, + "learning_rate": 6.259894824245779e-06, + "loss": 0.1082, + "step": 43610 + }, + { + "epoch": 4.26, + "learning_rate": 6.255743149737061e-06, + "loss": 0.0873, + "step": 43615 + }, + { + "epoch": 4.27, + "learning_rate": 6.251591475228342e-06, + "loss": 0.0935, + "step": 43620 + }, + { + "epoch": 4.27, + "learning_rate": 6.247439800719623e-06, + "loss": 0.0887, + "step": 43625 + }, + { + "epoch": 4.27, + "learning_rate": 6.243288126210906e-06, + "loss": 0.1035, + "step": 43630 + }, + { + "epoch": 4.27, + "learning_rate": 6.239136451702186e-06, + "loss": 0.0829, + "step": 43635 + }, + { + "epoch": 4.27, + "learning_rate": 6.234984777193469e-06, + "loss": 0.0848, + "step": 43640 + }, + { + "epoch": 4.27, + "learning_rate": 6.23083310268475e-06, + "loss": 0.0935, + "step": 43645 + }, + { + "epoch": 4.27, + "learning_rate": 6.226681428176031e-06, + "loss": 0.0853, + "step": 43650 + }, + { + "epoch": 4.27, + "learning_rate": 6.222529753667313e-06, + "loss": 0.1, + "step": 43655 + }, + { + "epoch": 4.27, + "learning_rate": 6.2183780791585945e-06, + "loss": 0.1061, + "step": 43660 + }, + { + "epoch": 4.27, + "learning_rate": 6.214226404649875e-06, + "loss": 0.0977, + "step": 43665 + }, + { + "epoch": 4.27, + "learning_rate": 6.210074730141157e-06, + "loss": 0.0811, + "step": 43670 + }, + { + "epoch": 4.27, + "learning_rate": 6.2059230556324385e-06, + "loss": 0.0971, + "step": 43675 + }, + { + "epoch": 4.27, + "learning_rate": 6.20177138112372e-06, + "loss": 0.0961, + "step": 43680 + }, + { + "epoch": 4.27, + "learning_rate": 6.197619706615002e-06, + "loss": 0.0957, + "step": 43685 + }, + { + "epoch": 4.27, + "learning_rate": 6.1934680321062825e-06, + "loss": 0.0825, + "step": 43690 + }, + { + "epoch": 4.27, + "learning_rate": 6.189316357597565e-06, + "loss": 0.107, + "step": 43695 + }, + { + "epoch": 4.27, + "learning_rate": 6.185164683088846e-06, + "loss": 0.0893, + "step": 43700 + }, + { + "epoch": 4.27, + "learning_rate": 6.181013008580128e-06, + "loss": 0.0937, + "step": 43705 + }, + { + "epoch": 4.27, + "learning_rate": 6.176861334071409e-06, + "loss": 0.1189, + "step": 43710 + }, + { + "epoch": 4.27, + "learning_rate": 6.1727096595626905e-06, + "loss": 0.0983, + "step": 43715 + }, + { + "epoch": 4.28, + "learning_rate": 6.168557985053972e-06, + "loss": 0.1028, + "step": 43720 + }, + { + "epoch": 4.28, + "learning_rate": 6.164406310545253e-06, + "loss": 0.098, + "step": 43725 + }, + { + "epoch": 4.28, + "learning_rate": 6.160254636036535e-06, + "loss": 0.0903, + "step": 43730 + }, + { + "epoch": 4.28, + "learning_rate": 6.156102961527816e-06, + "loss": 0.0835, + "step": 43735 + }, + { + "epoch": 4.28, + "learning_rate": 6.151951287019098e-06, + "loss": 0.079, + "step": 43740 + }, + { + "epoch": 4.28, + "learning_rate": 6.147799612510379e-06, + "loss": 0.1069, + "step": 43745 + }, + { + "epoch": 4.28, + "learning_rate": 6.143647938001661e-06, + "loss": 0.0948, + "step": 43750 + }, + { + "epoch": 4.28, + "learning_rate": 6.139496263492942e-06, + "loss": 0.0888, + "step": 43755 + }, + { + "epoch": 4.28, + "learning_rate": 6.135344588984224e-06, + "loss": 0.0941, + "step": 43760 + }, + { + "epoch": 4.28, + "learning_rate": 6.131192914475505e-06, + "loss": 0.078, + "step": 43765 + }, + { + "epoch": 4.28, + "learning_rate": 6.1270412399667875e-06, + "loss": 0.0746, + "step": 43770 + }, + { + "epoch": 4.28, + "learning_rate": 6.122889565458068e-06, + "loss": 0.0909, + "step": 43775 + }, + { + "epoch": 4.28, + "learning_rate": 6.118737890949349e-06, + "loss": 0.0858, + "step": 43780 + }, + { + "epoch": 4.28, + "learning_rate": 6.1145862164406315e-06, + "loss": 0.0889, + "step": 43785 + }, + { + "epoch": 4.28, + "learning_rate": 6.110434541931912e-06, + "loss": 0.0884, + "step": 43790 + }, + { + "epoch": 4.28, + "learning_rate": 6.106282867423195e-06, + "loss": 0.1173, + "step": 43795 + }, + { + "epoch": 4.28, + "learning_rate": 6.1021311929144755e-06, + "loss": 0.0826, + "step": 43800 + }, + { + "epoch": 4.28, + "learning_rate": 6.097979518405757e-06, + "loss": 0.0818, + "step": 43805 + }, + { + "epoch": 4.28, + "learning_rate": 6.093827843897039e-06, + "loss": 0.113, + "step": 43810 + }, + { + "epoch": 4.28, + "learning_rate": 6.08967616938832e-06, + "loss": 0.0915, + "step": 43815 + }, + { + "epoch": 4.28, + "learning_rate": 6.085524494879602e-06, + "loss": 0.0809, + "step": 43820 + }, + { + "epoch": 4.29, + "learning_rate": 6.0813728203708835e-06, + "loss": 0.1025, + "step": 43825 + }, + { + "epoch": 4.29, + "learning_rate": 6.077221145862164e-06, + "loss": 0.09, + "step": 43830 + }, + { + "epoch": 4.29, + "learning_rate": 6.073069471353446e-06, + "loss": 0.0894, + "step": 43835 + }, + { + "epoch": 4.29, + "learning_rate": 6.0689177968447275e-06, + "loss": 0.0868, + "step": 43840 + }, + { + "epoch": 4.29, + "learning_rate": 6.064766122336009e-06, + "loss": 0.1141, + "step": 43845 + }, + { + "epoch": 4.29, + "learning_rate": 6.060614447827291e-06, + "loss": 0.085, + "step": 43850 + }, + { + "epoch": 4.29, + "learning_rate": 6.0564627733185715e-06, + "loss": 0.0936, + "step": 43855 + }, + { + "epoch": 4.29, + "learning_rate": 6.052311098809854e-06, + "loss": 0.1116, + "step": 43860 + }, + { + "epoch": 4.29, + "learning_rate": 6.048159424301135e-06, + "loss": 0.0835, + "step": 43865 + }, + { + "epoch": 4.29, + "learning_rate": 6.044007749792416e-06, + "loss": 0.0831, + "step": 43870 + }, + { + "epoch": 4.29, + "learning_rate": 6.039856075283698e-06, + "loss": 0.112, + "step": 43875 + }, + { + "epoch": 4.29, + "learning_rate": 6.035704400774979e-06, + "loss": 0.0941, + "step": 43880 + }, + { + "epoch": 4.29, + "learning_rate": 6.031552726266261e-06, + "loss": 0.0712, + "step": 43885 + }, + { + "epoch": 4.29, + "learning_rate": 6.027401051757542e-06, + "loss": 0.0944, + "step": 43890 + }, + { + "epoch": 4.29, + "learning_rate": 6.023249377248824e-06, + "loss": 0.0978, + "step": 43895 + }, + { + "epoch": 4.29, + "learning_rate": 6.019097702740105e-06, + "loss": 0.0859, + "step": 43900 + }, + { + "epoch": 4.29, + "learning_rate": 6.014946028231387e-06, + "loss": 0.0788, + "step": 43905 + }, + { + "epoch": 4.29, + "learning_rate": 6.0107943537226685e-06, + "loss": 0.1001, + "step": 43910 + }, + { + "epoch": 4.29, + "learning_rate": 6.00664267921395e-06, + "loss": 0.0793, + "step": 43915 + }, + { + "epoch": 4.29, + "learning_rate": 6.002491004705231e-06, + "loss": 0.0801, + "step": 43920 + }, + { + "epoch": 4.3, + "learning_rate": 5.998339330196513e-06, + "loss": 0.1026, + "step": 43925 + }, + { + "epoch": 4.3, + "learning_rate": 5.994187655687794e-06, + "loss": 0.086, + "step": 43930 + }, + { + "epoch": 4.3, + "learning_rate": 5.990035981179076e-06, + "loss": 0.0911, + "step": 43935 + }, + { + "epoch": 4.3, + "learning_rate": 5.985884306670357e-06, + "loss": 0.0837, + "step": 43940 + }, + { + "epoch": 4.3, + "learning_rate": 5.981732632161638e-06, + "loss": 0.0922, + "step": 43945 + }, + { + "epoch": 4.3, + "learning_rate": 5.9775809576529205e-06, + "loss": 0.0843, + "step": 43950 + }, + { + "epoch": 4.3, + "learning_rate": 5.973429283144201e-06, + "loss": 0.1019, + "step": 43955 + }, + { + "epoch": 4.3, + "learning_rate": 5.969277608635483e-06, + "loss": 0.1075, + "step": 43960 + }, + { + "epoch": 4.3, + "learning_rate": 5.9651259341267645e-06, + "loss": 0.089, + "step": 43965 + }, + { + "epoch": 4.3, + "learning_rate": 5.960974259618046e-06, + "loss": 0.0853, + "step": 43970 + }, + { + "epoch": 4.3, + "learning_rate": 5.956822585109328e-06, + "loss": 0.1116, + "step": 43975 + }, + { + "epoch": 4.3, + "learning_rate": 5.952670910600609e-06, + "loss": 0.0981, + "step": 43980 + }, + { + "epoch": 4.3, + "learning_rate": 5.94851923609189e-06, + "loss": 0.0856, + "step": 43985 + }, + { + "epoch": 4.3, + "learning_rate": 5.944367561583172e-06, + "loss": 0.0994, + "step": 43990 + }, + { + "epoch": 4.3, + "learning_rate": 5.940215887074453e-06, + "loss": 0.1001, + "step": 43995 + }, + { + "epoch": 4.3, + "learning_rate": 5.936064212565735e-06, + "loss": 0.081, + "step": 44000 + }, + { + "epoch": 4.3, + "eval_cer": 0.05402443169599811, + "eval_loss": 0.22213901579380035, + "eval_runtime": 278.704, + "eval_samples_per_second": 58.736, + "eval_steps_per_second": 1.633, + "eval_wer": 0.13885061674382768, + "step": 44000 + }, + { + "epoch": 4.3, + "learning_rate": 5.931912538057017e-06, + "loss": 0.0932, + "step": 44005 + }, + { + "epoch": 4.3, + "learning_rate": 5.927760863548297e-06, + "loss": 0.1099, + "step": 44010 + }, + { + "epoch": 4.3, + "learning_rate": 5.92360918903958e-06, + "loss": 0.0799, + "step": 44015 + }, + { + "epoch": 4.3, + "learning_rate": 5.919457514530861e-06, + "loss": 0.089, + "step": 44020 + }, + { + "epoch": 4.3, + "learning_rate": 5.915305840022143e-06, + "loss": 0.1162, + "step": 44025 + }, + { + "epoch": 4.31, + "learning_rate": 5.911154165513424e-06, + "loss": 0.0912, + "step": 44030 + }, + { + "epoch": 4.31, + "learning_rate": 5.9070024910047055e-06, + "loss": 0.0849, + "step": 44035 + }, + { + "epoch": 4.31, + "learning_rate": 5.902850816495987e-06, + "loss": 0.0942, + "step": 44040 + }, + { + "epoch": 4.31, + "learning_rate": 5.898699141987268e-06, + "loss": 0.1094, + "step": 44045 + }, + { + "epoch": 4.31, + "learning_rate": 5.89454746747855e-06, + "loss": 0.0825, + "step": 44050 + }, + { + "epoch": 4.31, + "learning_rate": 5.890395792969831e-06, + "loss": 0.0783, + "step": 44055 + }, + { + "epoch": 4.31, + "learning_rate": 5.886244118461113e-06, + "loss": 0.1066, + "step": 44060 + }, + { + "epoch": 4.31, + "learning_rate": 5.882092443952394e-06, + "loss": 0.0861, + "step": 44065 + }, + { + "epoch": 4.31, + "learning_rate": 5.877940769443676e-06, + "loss": 0.0968, + "step": 44070 + }, + { + "epoch": 4.31, + "learning_rate": 5.873789094934957e-06, + "loss": 0.1076, + "step": 44075 + }, + { + "epoch": 4.31, + "learning_rate": 5.869637420426239e-06, + "loss": 0.0863, + "step": 44080 + }, + { + "epoch": 4.31, + "learning_rate": 5.86548574591752e-06, + "loss": 0.0779, + "step": 44085 + }, + { + "epoch": 4.31, + "learning_rate": 5.861334071408802e-06, + "loss": 0.0883, + "step": 44090 + }, + { + "epoch": 4.31, + "learning_rate": 5.857182396900083e-06, + "loss": 0.1073, + "step": 44095 + }, + { + "epoch": 4.31, + "learning_rate": 5.853030722391364e-06, + "loss": 0.0791, + "step": 44100 + }, + { + "epoch": 4.31, + "learning_rate": 5.848879047882646e-06, + "loss": 0.0836, + "step": 44105 + }, + { + "epoch": 4.31, + "learning_rate": 5.844727373373927e-06, + "loss": 0.094, + "step": 44110 + }, + { + "epoch": 4.31, + "learning_rate": 5.84057569886521e-06, + "loss": 0.086, + "step": 44115 + }, + { + "epoch": 4.31, + "learning_rate": 5.83642402435649e-06, + "loss": 0.0847, + "step": 44120 + }, + { + "epoch": 4.31, + "learning_rate": 5.832272349847772e-06, + "loss": 0.085, + "step": 44125 + }, + { + "epoch": 4.32, + "learning_rate": 5.828120675339054e-06, + "loss": 0.0859, + "step": 44130 + }, + { + "epoch": 4.32, + "learning_rate": 5.823969000830335e-06, + "loss": 0.0894, + "step": 44135 + }, + { + "epoch": 4.32, + "learning_rate": 5.819817326321617e-06, + "loss": 0.0823, + "step": 44140 + }, + { + "epoch": 4.32, + "learning_rate": 5.8156656518128985e-06, + "loss": 0.0976, + "step": 44145 + }, + { + "epoch": 4.32, + "learning_rate": 5.811513977304179e-06, + "loss": 0.0873, + "step": 44150 + }, + { + "epoch": 4.32, + "learning_rate": 5.807362302795461e-06, + "loss": 0.0833, + "step": 44155 + }, + { + "epoch": 4.32, + "learning_rate": 5.8032106282867425e-06, + "loss": 0.0945, + "step": 44160 + }, + { + "epoch": 4.32, + "learning_rate": 5.799058953778023e-06, + "loss": 0.0969, + "step": 44165 + }, + { + "epoch": 4.32, + "learning_rate": 5.794907279269306e-06, + "loss": 0.0783, + "step": 44170 + }, + { + "epoch": 4.32, + "learning_rate": 5.7907556047605865e-06, + "loss": 0.0975, + "step": 44175 + }, + { + "epoch": 4.32, + "learning_rate": 5.786603930251869e-06, + "loss": 0.1033, + "step": 44180 + }, + { + "epoch": 4.32, + "learning_rate": 5.78245225574315e-06, + "loss": 0.0976, + "step": 44185 + }, + { + "epoch": 4.32, + "learning_rate": 5.778300581234431e-06, + "loss": 0.0925, + "step": 44190 + }, + { + "epoch": 4.32, + "learning_rate": 5.774148906725713e-06, + "loss": 0.0999, + "step": 44195 + }, + { + "epoch": 4.32, + "learning_rate": 5.7699972322169945e-06, + "loss": 0.0941, + "step": 44200 + }, + { + "epoch": 4.32, + "learning_rate": 5.765845557708276e-06, + "loss": 0.0944, + "step": 44205 + }, + { + "epoch": 4.32, + "learning_rate": 5.761693883199557e-06, + "loss": 0.1044, + "step": 44210 + }, + { + "epoch": 4.32, + "learning_rate": 5.7575422086908385e-06, + "loss": 0.0906, + "step": 44215 + }, + { + "epoch": 4.32, + "learning_rate": 5.75339053418212e-06, + "loss": 0.0777, + "step": 44220 + }, + { + "epoch": 4.32, + "learning_rate": 5.749238859673402e-06, + "loss": 0.107, + "step": 44225 + }, + { + "epoch": 4.32, + "learning_rate": 5.745087185164683e-06, + "loss": 0.0921, + "step": 44230 + }, + { + "epoch": 4.33, + "learning_rate": 5.740935510655965e-06, + "loss": 0.0781, + "step": 44235 + }, + { + "epoch": 4.33, + "learning_rate": 5.736783836147246e-06, + "loss": 0.0876, + "step": 44240 + }, + { + "epoch": 4.33, + "learning_rate": 5.732632161638528e-06, + "loss": 0.0951, + "step": 44245 + }, + { + "epoch": 4.33, + "learning_rate": 5.728480487129809e-06, + "loss": 0.0807, + "step": 44250 + }, + { + "epoch": 4.33, + "learning_rate": 5.7243288126210915e-06, + "loss": 0.0819, + "step": 44255 + }, + { + "epoch": 4.33, + "learning_rate": 5.720177138112372e-06, + "loss": 0.1025, + "step": 44260 + }, + { + "epoch": 4.33, + "learning_rate": 5.716025463603653e-06, + "loss": 0.0984, + "step": 44265 + }, + { + "epoch": 4.33, + "learning_rate": 5.7118737890949355e-06, + "loss": 0.074, + "step": 44270 + }, + { + "epoch": 4.33, + "learning_rate": 5.707722114586216e-06, + "loss": 0.0885, + "step": 44275 + }, + { + "epoch": 4.33, + "learning_rate": 5.703570440077498e-06, + "loss": 0.1001, + "step": 44280 + }, + { + "epoch": 4.33, + "learning_rate": 5.6994187655687795e-06, + "loss": 0.0855, + "step": 44285 + }, + { + "epoch": 4.33, + "learning_rate": 5.695267091060061e-06, + "loss": 0.0877, + "step": 44290 + }, + { + "epoch": 4.33, + "learning_rate": 5.691115416551343e-06, + "loss": 0.0986, + "step": 44295 + }, + { + "epoch": 4.33, + "learning_rate": 5.686963742042624e-06, + "loss": 0.0806, + "step": 44300 + }, + { + "epoch": 4.33, + "learning_rate": 5.682812067533905e-06, + "loss": 0.0772, + "step": 44305 + }, + { + "epoch": 4.33, + "learning_rate": 5.6786603930251875e-06, + "loss": 0.1008, + "step": 44310 + }, + { + "epoch": 4.33, + "learning_rate": 5.674508718516468e-06, + "loss": 0.0841, + "step": 44315 + }, + { + "epoch": 4.33, + "learning_rate": 5.67035704400775e-06, + "loss": 0.0764, + "step": 44320 + }, + { + "epoch": 4.33, + "learning_rate": 5.6662053694990315e-06, + "loss": 0.1026, + "step": 44325 + }, + { + "epoch": 4.33, + "learning_rate": 5.662053694990312e-06, + "loss": 0.0732, + "step": 44330 + }, + { + "epoch": 4.34, + "learning_rate": 5.657902020481595e-06, + "loss": 0.0704, + "step": 44335 + }, + { + "epoch": 4.34, + "learning_rate": 5.6537503459728755e-06, + "loss": 0.0734, + "step": 44340 + }, + { + "epoch": 4.34, + "learning_rate": 5.649598671464158e-06, + "loss": 0.0953, + "step": 44345 + }, + { + "epoch": 4.34, + "learning_rate": 5.645446996955439e-06, + "loss": 0.0934, + "step": 44350 + }, + { + "epoch": 4.34, + "learning_rate": 5.64129532244672e-06, + "loss": 0.0815, + "step": 44355 + }, + { + "epoch": 4.34, + "learning_rate": 5.637143647938002e-06, + "loss": 0.115, + "step": 44360 + }, + { + "epoch": 4.34, + "learning_rate": 5.632991973429284e-06, + "loss": 0.0896, + "step": 44365 + }, + { + "epoch": 4.34, + "learning_rate": 5.628840298920564e-06, + "loss": 0.098, + "step": 44370 + }, + { + "epoch": 4.34, + "learning_rate": 5.624688624411846e-06, + "loss": 0.0983, + "step": 44375 + }, + { + "epoch": 4.34, + "learning_rate": 5.620536949903128e-06, + "loss": 0.0989, + "step": 44380 + }, + { + "epoch": 4.34, + "learning_rate": 5.616385275394409e-06, + "loss": 0.0812, + "step": 44385 + }, + { + "epoch": 4.34, + "learning_rate": 5.612233600885691e-06, + "loss": 0.0766, + "step": 44390 + }, + { + "epoch": 4.34, + "learning_rate": 5.608081926376972e-06, + "loss": 0.0963, + "step": 44395 + }, + { + "epoch": 4.34, + "learning_rate": 5.603930251868254e-06, + "loss": 0.0906, + "step": 44400 + }, + { + "epoch": 4.34, + "learning_rate": 5.599778577359535e-06, + "loss": 0.0849, + "step": 44405 + }, + { + "epoch": 4.34, + "learning_rate": 5.595626902850817e-06, + "loss": 0.0985, + "step": 44410 + }, + { + "epoch": 4.34, + "learning_rate": 5.591475228342098e-06, + "loss": 0.0907, + "step": 44415 + }, + { + "epoch": 4.34, + "learning_rate": 5.58732355383338e-06, + "loss": 0.1137, + "step": 44420 + }, + { + "epoch": 4.34, + "learning_rate": 5.583171879324661e-06, + "loss": 0.0979, + "step": 44425 + }, + { + "epoch": 4.34, + "learning_rate": 5.579020204815942e-06, + "loss": 0.088, + "step": 44430 + }, + { + "epoch": 4.35, + "learning_rate": 5.5748685303072245e-06, + "loss": 0.0908, + "step": 44435 + }, + { + "epoch": 4.35, + "learning_rate": 5.570716855798505e-06, + "loss": 0.0748, + "step": 44440 + }, + { + "epoch": 4.35, + "learning_rate": 5.566565181289787e-06, + "loss": 0.1074, + "step": 44445 + }, + { + "epoch": 4.35, + "learning_rate": 5.5624135067810685e-06, + "loss": 0.0978, + "step": 44450 + }, + { + "epoch": 4.35, + "learning_rate": 5.55826183227235e-06, + "loss": 0.0782, + "step": 44455 + }, + { + "epoch": 4.35, + "learning_rate": 5.554110157763632e-06, + "loss": 0.0899, + "step": 44460 + }, + { + "epoch": 4.35, + "learning_rate": 5.549958483254913e-06, + "loss": 0.0753, + "step": 44465 + }, + { + "epoch": 4.35, + "learning_rate": 5.545806808746194e-06, + "loss": 0.0781, + "step": 44470 + }, + { + "epoch": 4.35, + "learning_rate": 5.541655134237477e-06, + "loss": 0.105, + "step": 44475 + }, + { + "epoch": 4.35, + "learning_rate": 5.537503459728757e-06, + "loss": 0.0864, + "step": 44480 + }, + { + "epoch": 4.35, + "learning_rate": 5.533351785220038e-06, + "loss": 0.0911, + "step": 44485 + }, + { + "epoch": 4.35, + "learning_rate": 5.529200110711321e-06, + "loss": 0.0862, + "step": 44490 + }, + { + "epoch": 4.35, + "learning_rate": 5.525048436202601e-06, + "loss": 0.1017, + "step": 44495 + }, + { + "epoch": 4.35, + "learning_rate": 5.520896761693884e-06, + "loss": 0.0878, + "step": 44500 + }, + { + "epoch": 4.35, + "eval_cer": 0.05375158103086681, + "eval_loss": 0.22322100400924683, + "eval_runtime": 279.5723, + "eval_samples_per_second": 58.554, + "eval_steps_per_second": 1.627, + "eval_wer": 0.13828905010349804, + "step": 44500 + }, + { + "epoch": 4.35, + "learning_rate": 5.516745087185165e-06, + "loss": 0.0896, + "step": 44505 + }, + { + "epoch": 4.35, + "learning_rate": 5.512593412676446e-06, + "loss": 0.113, + "step": 44510 + }, + { + "epoch": 4.35, + "learning_rate": 5.508441738167728e-06, + "loss": 0.1042, + "step": 44515 + }, + { + "epoch": 4.35, + "learning_rate": 5.5042900636590094e-06, + "loss": 0.0841, + "step": 44520 + }, + { + "epoch": 4.35, + "learning_rate": 5.500138389150291e-06, + "loss": 0.1006, + "step": 44525 + }, + { + "epoch": 4.35, + "learning_rate": 5.495986714641573e-06, + "loss": 0.0953, + "step": 44530 + }, + { + "epoch": 4.35, + "learning_rate": 5.4918350401328534e-06, + "loss": 0.0769, + "step": 44535 + }, + { + "epoch": 4.36, + "learning_rate": 5.487683365624135e-06, + "loss": 0.076, + "step": 44540 + }, + { + "epoch": 4.36, + "learning_rate": 5.483531691115417e-06, + "loss": 0.1077, + "step": 44545 + }, + { + "epoch": 4.36, + "learning_rate": 5.479380016606698e-06, + "loss": 0.0901, + "step": 44550 + }, + { + "epoch": 4.36, + "learning_rate": 5.47522834209798e-06, + "loss": 0.0975, + "step": 44555 + }, + { + "epoch": 4.36, + "learning_rate": 5.471076667589261e-06, + "loss": 0.1245, + "step": 44560 + }, + { + "epoch": 4.36, + "learning_rate": 5.466924993080543e-06, + "loss": 0.0937, + "step": 44565 + }, + { + "epoch": 4.36, + "learning_rate": 5.462773318571824e-06, + "loss": 0.0938, + "step": 44570 + }, + { + "epoch": 4.36, + "learning_rate": 5.4586216440631055e-06, + "loss": 0.1087, + "step": 44575 + }, + { + "epoch": 4.36, + "learning_rate": 5.454469969554387e-06, + "loss": 0.097, + "step": 44580 + }, + { + "epoch": 4.36, + "learning_rate": 5.450318295045668e-06, + "loss": 0.096, + "step": 44585 + }, + { + "epoch": 4.36, + "learning_rate": 5.44616662053695e-06, + "loss": 0.076, + "step": 44590 + }, + { + "epoch": 4.36, + "learning_rate": 5.442014946028231e-06, + "loss": 0.0988, + "step": 44595 + }, + { + "epoch": 4.36, + "learning_rate": 5.437863271519513e-06, + "loss": 0.0787, + "step": 44600 + }, + { + "epoch": 4.36, + "learning_rate": 5.433711597010794e-06, + "loss": 0.0774, + "step": 44605 + }, + { + "epoch": 4.36, + "learning_rate": 5.429559922502076e-06, + "loss": 0.0963, + "step": 44610 + }, + { + "epoch": 4.36, + "learning_rate": 5.425408247993358e-06, + "loss": 0.0893, + "step": 44615 + }, + { + "epoch": 4.36, + "learning_rate": 5.421256573484639e-06, + "loss": 0.0913, + "step": 44620 + }, + { + "epoch": 4.36, + "learning_rate": 5.41710489897592e-06, + "loss": 0.095, + "step": 44625 + }, + { + "epoch": 4.36, + "learning_rate": 5.4129532244672024e-06, + "loss": 0.0889, + "step": 44630 + }, + { + "epoch": 4.36, + "learning_rate": 5.408801549958483e-06, + "loss": 0.0908, + "step": 44635 + }, + { + "epoch": 4.37, + "learning_rate": 5.404649875449765e-06, + "loss": 0.0895, + "step": 44640 + }, + { + "epoch": 4.37, + "learning_rate": 5.4004982009410464e-06, + "loss": 0.1166, + "step": 44645 + }, + { + "epoch": 4.37, + "learning_rate": 5.396346526432327e-06, + "loss": 0.0985, + "step": 44650 + }, + { + "epoch": 4.37, + "learning_rate": 5.39219485192361e-06, + "loss": 0.0797, + "step": 44655 + }, + { + "epoch": 4.37, + "learning_rate": 5.3880431774148904e-06, + "loss": 0.1062, + "step": 44660 + }, + { + "epoch": 4.37, + "learning_rate": 5.383891502906173e-06, + "loss": 0.0904, + "step": 44665 + }, + { + "epoch": 4.37, + "learning_rate": 5.379739828397454e-06, + "loss": 0.0769, + "step": 44670 + }, + { + "epoch": 4.37, + "learning_rate": 5.375588153888735e-06, + "loss": 0.0889, + "step": 44675 + }, + { + "epoch": 4.37, + "learning_rate": 5.371436479380017e-06, + "loss": 0.0948, + "step": 44680 + }, + { + "epoch": 4.37, + "learning_rate": 5.3672848048712985e-06, + "loss": 0.0863, + "step": 44685 + }, + { + "epoch": 4.37, + "learning_rate": 5.363133130362579e-06, + "loss": 0.0934, + "step": 44690 + }, + { + "epoch": 4.37, + "learning_rate": 5.358981455853861e-06, + "loss": 0.1117, + "step": 44695 + }, + { + "epoch": 4.37, + "learning_rate": 5.3548297813451425e-06, + "loss": 0.0798, + "step": 44700 + }, + { + "epoch": 4.37, + "learning_rate": 5.350678106836424e-06, + "loss": 0.0887, + "step": 44705 + }, + { + "epoch": 4.37, + "learning_rate": 5.346526432327706e-06, + "loss": 0.1088, + "step": 44710 + }, + { + "epoch": 4.37, + "learning_rate": 5.3423747578189865e-06, + "loss": 0.0909, + "step": 44715 + }, + { + "epoch": 4.37, + "learning_rate": 5.338223083310269e-06, + "loss": 0.0766, + "step": 44720 + }, + { + "epoch": 4.37, + "learning_rate": 5.33407140880155e-06, + "loss": 0.0914, + "step": 44725 + }, + { + "epoch": 4.37, + "learning_rate": 5.329919734292832e-06, + "loss": 0.0852, + "step": 44730 + }, + { + "epoch": 4.37, + "learning_rate": 5.325768059784113e-06, + "loss": 0.0713, + "step": 44735 + }, + { + "epoch": 4.37, + "learning_rate": 5.321616385275395e-06, + "loss": 0.087, + "step": 44740 + }, + { + "epoch": 4.38, + "learning_rate": 5.317464710766676e-06, + "loss": 0.1142, + "step": 44745 + }, + { + "epoch": 4.38, + "learning_rate": 5.313313036257957e-06, + "loss": 0.0862, + "step": 44750 + }, + { + "epoch": 4.38, + "learning_rate": 5.3091613617492394e-06, + "loss": 0.0879, + "step": 44755 + }, + { + "epoch": 4.38, + "learning_rate": 5.30500968724052e-06, + "loss": 0.1014, + "step": 44760 + }, + { + "epoch": 4.38, + "learning_rate": 5.300858012731802e-06, + "loss": 0.0919, + "step": 44765 + }, + { + "epoch": 4.38, + "learning_rate": 5.2967063382230834e-06, + "loss": 0.0785, + "step": 44770 + }, + { + "epoch": 4.38, + "learning_rate": 5.292554663714365e-06, + "loss": 0.1033, + "step": 44775 + }, + { + "epoch": 4.38, + "learning_rate": 5.288402989205646e-06, + "loss": 0.1032, + "step": 44780 + }, + { + "epoch": 4.38, + "learning_rate": 5.284251314696928e-06, + "loss": 0.0816, + "step": 44785 + }, + { + "epoch": 4.38, + "learning_rate": 5.280099640188209e-06, + "loss": 0.0959, + "step": 44790 + }, + { + "epoch": 4.38, + "learning_rate": 5.2759479656794915e-06, + "loss": 0.1062, + "step": 44795 + }, + { + "epoch": 4.38, + "learning_rate": 5.271796291170772e-06, + "loss": 0.0892, + "step": 44800 + }, + { + "epoch": 4.38, + "learning_rate": 5.267644616662053e-06, + "loss": 0.0703, + "step": 44805 + }, + { + "epoch": 4.38, + "learning_rate": 5.2634929421533355e-06, + "loss": 0.0957, + "step": 44810 + }, + { + "epoch": 4.38, + "learning_rate": 5.259341267644616e-06, + "loss": 0.0828, + "step": 44815 + }, + { + "epoch": 4.38, + "learning_rate": 5.255189593135899e-06, + "loss": 0.0785, + "step": 44820 + }, + { + "epoch": 4.38, + "learning_rate": 5.2510379186271795e-06, + "loss": 0.1023, + "step": 44825 + }, + { + "epoch": 4.38, + "learning_rate": 5.246886244118461e-06, + "loss": 0.089, + "step": 44830 + }, + { + "epoch": 4.38, + "learning_rate": 5.242734569609743e-06, + "loss": 0.0848, + "step": 44835 + }, + { + "epoch": 4.38, + "learning_rate": 5.238582895101024e-06, + "loss": 0.085, + "step": 44840 + }, + { + "epoch": 4.39, + "learning_rate": 5.234431220592306e-06, + "loss": 0.1045, + "step": 44845 + }, + { + "epoch": 4.39, + "learning_rate": 5.230279546083588e-06, + "loss": 0.0897, + "step": 44850 + }, + { + "epoch": 4.39, + "learning_rate": 5.226127871574868e-06, + "loss": 0.0908, + "step": 44855 + }, + { + "epoch": 4.39, + "learning_rate": 5.22197619706615e-06, + "loss": 0.0993, + "step": 44860 + }, + { + "epoch": 4.39, + "learning_rate": 5.217824522557432e-06, + "loss": 0.0807, + "step": 44865 + }, + { + "epoch": 4.39, + "learning_rate": 5.213672848048713e-06, + "loss": 0.0821, + "step": 44870 + }, + { + "epoch": 4.39, + "learning_rate": 5.209521173539995e-06, + "loss": 0.1153, + "step": 44875 + }, + { + "epoch": 4.39, + "learning_rate": 5.205369499031276e-06, + "loss": 0.0893, + "step": 44880 + }, + { + "epoch": 4.39, + "learning_rate": 5.201217824522558e-06, + "loss": 0.0804, + "step": 44885 + }, + { + "epoch": 4.39, + "learning_rate": 5.197066150013839e-06, + "loss": 0.0763, + "step": 44890 + }, + { + "epoch": 4.39, + "learning_rate": 5.1929144755051204e-06, + "loss": 0.109, + "step": 44895 + }, + { + "epoch": 4.39, + "learning_rate": 5.188762800996402e-06, + "loss": 0.0946, + "step": 44900 + }, + { + "epoch": 4.39, + "learning_rate": 5.184611126487684e-06, + "loss": 0.0761, + "step": 44905 + }, + { + "epoch": 4.39, + "learning_rate": 5.180459451978965e-06, + "loss": 0.1004, + "step": 44910 + }, + { + "epoch": 4.39, + "learning_rate": 5.176307777470246e-06, + "loss": 0.1009, + "step": 44915 + }, + { + "epoch": 4.39, + "learning_rate": 5.172156102961528e-06, + "loss": 0.0882, + "step": 44920 + }, + { + "epoch": 4.39, + "learning_rate": 5.168004428452809e-06, + "loss": 0.0904, + "step": 44925 + }, + { + "epoch": 4.39, + "learning_rate": 5.163852753944091e-06, + "loss": 0.082, + "step": 44930 + }, + { + "epoch": 4.39, + "learning_rate": 5.1597010794353725e-06, + "loss": 0.0815, + "step": 44935 + }, + { + "epoch": 4.39, + "learning_rate": 5.155549404926654e-06, + "loss": 0.0802, + "step": 44940 + }, + { + "epoch": 4.39, + "learning_rate": 5.151397730417935e-06, + "loss": 0.1055, + "step": 44945 + }, + { + "epoch": 4.4, + "learning_rate": 5.147246055909217e-06, + "loss": 0.0777, + "step": 44950 + }, + { + "epoch": 4.4, + "learning_rate": 5.143094381400498e-06, + "loss": 0.093, + "step": 44955 + }, + { + "epoch": 4.4, + "learning_rate": 5.138942706891781e-06, + "loss": 0.1069, + "step": 44960 + }, + { + "epoch": 4.4, + "learning_rate": 5.134791032383061e-06, + "loss": 0.0798, + "step": 44965 + }, + { + "epoch": 4.4, + "learning_rate": 5.130639357874342e-06, + "loss": 0.0818, + "step": 44970 + }, + { + "epoch": 4.4, + "learning_rate": 5.126487683365625e-06, + "loss": 0.1113, + "step": 44975 + }, + { + "epoch": 4.4, + "learning_rate": 5.122336008856905e-06, + "loss": 0.0954, + "step": 44980 + }, + { + "epoch": 4.4, + "learning_rate": 5.118184334348187e-06, + "loss": 0.0776, + "step": 44985 + }, + { + "epoch": 4.4, + "learning_rate": 5.114032659839469e-06, + "loss": 0.089, + "step": 44990 + }, + { + "epoch": 4.4, + "learning_rate": 5.10988098533075e-06, + "loss": 0.0946, + "step": 44995 + }, + { + "epoch": 4.4, + "learning_rate": 5.105729310822032e-06, + "loss": 0.0837, + "step": 45000 + }, + { + "epoch": 4.4, + "eval_cer": 0.05398396655498288, + "eval_loss": 0.22579458355903625, + "eval_runtime": 277.7689, + "eval_samples_per_second": 58.934, + "eval_steps_per_second": 1.638, + "eval_wer": 0.13809315476384817, + "step": 45000 + }, + { + "epoch": 4.4, + "learning_rate": 5.1015776363133134e-06, + "loss": 0.0833, + "step": 45005 + }, + { + "epoch": 4.4, + "learning_rate": 5.097425961804594e-06, + "loss": 0.0965, + "step": 45010 + }, + { + "epoch": 4.4, + "learning_rate": 5.093274287295877e-06, + "loss": 0.0904, + "step": 45015 + }, + { + "epoch": 4.4, + "learning_rate": 5.0891226127871574e-06, + "loss": 0.0889, + "step": 45020 + }, + { + "epoch": 4.4, + "learning_rate": 5.084970938278439e-06, + "loss": 0.0997, + "step": 45025 + }, + { + "epoch": 4.4, + "learning_rate": 5.080819263769721e-06, + "loss": 0.0914, + "step": 45030 + }, + { + "epoch": 4.4, + "learning_rate": 5.0766675892610014e-06, + "loss": 0.0824, + "step": 45035 + }, + { + "epoch": 4.4, + "learning_rate": 5.072515914752284e-06, + "loss": 0.0828, + "step": 45040 + }, + { + "epoch": 4.4, + "learning_rate": 5.068364240243565e-06, + "loss": 0.1115, + "step": 45045 + }, + { + "epoch": 4.41, + "learning_rate": 5.064212565734847e-06, + "loss": 0.0878, + "step": 45050 + }, + { + "epoch": 4.41, + "learning_rate": 5.060060891226128e-06, + "loss": 0.0847, + "step": 45055 + }, + { + "epoch": 4.41, + "learning_rate": 5.0559092167174095e-06, + "loss": 0.1067, + "step": 45060 + }, + { + "epoch": 4.41, + "learning_rate": 5.051757542208691e-06, + "loss": 0.088, + "step": 45065 + }, + { + "epoch": 4.41, + "learning_rate": 5.047605867699973e-06, + "loss": 0.0818, + "step": 45070 + }, + { + "epoch": 4.41, + "learning_rate": 5.043454193191254e-06, + "loss": 0.1111, + "step": 45075 + }, + { + "epoch": 4.41, + "learning_rate": 5.039302518682535e-06, + "loss": 0.0984, + "step": 45080 + }, + { + "epoch": 4.41, + "learning_rate": 5.035150844173817e-06, + "loss": 0.0871, + "step": 45085 + }, + { + "epoch": 4.41, + "learning_rate": 5.030999169665098e-06, + "loss": 0.1031, + "step": 45090 + }, + { + "epoch": 4.41, + "learning_rate": 5.02684749515638e-06, + "loss": 0.1041, + "step": 45095 + }, + { + "epoch": 4.41, + "learning_rate": 5.022695820647661e-06, + "loss": 0.0929, + "step": 45100 + }, + { + "epoch": 4.41, + "learning_rate": 5.018544146138943e-06, + "loss": 0.0914, + "step": 45105 + }, + { + "epoch": 4.41, + "learning_rate": 5.014392471630224e-06, + "loss": 0.1075, + "step": 45110 + }, + { + "epoch": 4.41, + "learning_rate": 5.0102407971215064e-06, + "loss": 0.0935, + "step": 45115 + }, + { + "epoch": 4.41, + "learning_rate": 5.006089122612787e-06, + "loss": 0.098, + "step": 45120 + }, + { + "epoch": 4.41, + "learning_rate": 5.001937448104069e-06, + "loss": 0.1144, + "step": 45125 + }, + { + "epoch": 4.41, + "learning_rate": 4.9977857735953504e-06, + "loss": 0.0796, + "step": 45130 + }, + { + "epoch": 4.41, + "learning_rate": 4.993634099086631e-06, + "loss": 0.0795, + "step": 45135 + }, + { + "epoch": 4.41, + "learning_rate": 4.989482424577914e-06, + "loss": 0.073, + "step": 45140 + }, + { + "epoch": 4.41, + "learning_rate": 4.9853307500691944e-06, + "loss": 0.1021, + "step": 45145 + }, + { + "epoch": 4.41, + "learning_rate": 4.981179075560476e-06, + "loss": 0.1008, + "step": 45150 + }, + { + "epoch": 4.42, + "learning_rate": 4.977027401051758e-06, + "loss": 0.0765, + "step": 45155 + }, + { + "epoch": 4.42, + "learning_rate": 4.972875726543039e-06, + "loss": 0.1105, + "step": 45160 + }, + { + "epoch": 4.42, + "learning_rate": 4.968724052034321e-06, + "loss": 0.0946, + "step": 45165 + }, + { + "epoch": 4.42, + "learning_rate": 4.9645723775256025e-06, + "loss": 0.0801, + "step": 45170 + }, + { + "epoch": 4.42, + "learning_rate": 4.960420703016883e-06, + "loss": 0.0943, + "step": 45175 + }, + { + "epoch": 4.42, + "learning_rate": 4.956269028508166e-06, + "loss": 0.0963, + "step": 45180 + }, + { + "epoch": 4.42, + "learning_rate": 4.9521173539994465e-06, + "loss": 0.0879, + "step": 45185 + }, + { + "epoch": 4.42, + "learning_rate": 4.947965679490727e-06, + "loss": 0.0937, + "step": 45190 + }, + { + "epoch": 4.42, + "learning_rate": 4.94381400498201e-06, + "loss": 0.1096, + "step": 45195 + }, + { + "epoch": 4.42, + "learning_rate": 4.9396623304732905e-06, + "loss": 0.0899, + "step": 45200 + }, + { + "epoch": 4.42, + "learning_rate": 4.935510655964573e-06, + "loss": 0.0855, + "step": 45205 + }, + { + "epoch": 4.42, + "learning_rate": 4.931358981455854e-06, + "loss": 0.1064, + "step": 45210 + }, + { + "epoch": 4.42, + "learning_rate": 4.927207306947135e-06, + "loss": 0.0915, + "step": 45215 + }, + { + "epoch": 4.42, + "learning_rate": 4.923055632438417e-06, + "loss": 0.0716, + "step": 45220 + }, + { + "epoch": 4.42, + "learning_rate": 4.9197342928314424e-06, + "loss": 0.1149, + "step": 45225 + }, + { + "epoch": 4.42, + "learning_rate": 4.915582618322724e-06, + "loss": 0.0876, + "step": 45230 + }, + { + "epoch": 4.42, + "learning_rate": 4.911430943814005e-06, + "loss": 0.0748, + "step": 45235 + }, + { + "epoch": 4.42, + "learning_rate": 4.9072792693052864e-06, + "loss": 0.0757, + "step": 45240 + }, + { + "epoch": 4.42, + "learning_rate": 4.903127594796568e-06, + "loss": 0.1095, + "step": 45245 + }, + { + "epoch": 4.42, + "learning_rate": 4.89897592028785e-06, + "loss": 0.0816, + "step": 45250 + }, + { + "epoch": 4.43, + "learning_rate": 4.894824245779131e-06, + "loss": 0.0947, + "step": 45255 + }, + { + "epoch": 4.43, + "learning_rate": 4.890672571270412e-06, + "loss": 0.1088, + "step": 45260 + }, + { + "epoch": 4.43, + "learning_rate": 4.8865208967616945e-06, + "loss": 0.0841, + "step": 45265 + }, + { + "epoch": 4.43, + "learning_rate": 4.882369222252975e-06, + "loss": 0.0849, + "step": 45270 + }, + { + "epoch": 4.43, + "learning_rate": 4.878217547744257e-06, + "loss": 0.114, + "step": 45275 + }, + { + "epoch": 4.43, + "learning_rate": 4.8740658732355385e-06, + "loss": 0.0858, + "step": 45280 + }, + { + "epoch": 4.43, + "learning_rate": 4.86991419872682e-06, + "loss": 0.0786, + "step": 45285 + }, + { + "epoch": 4.43, + "learning_rate": 4.865762524218102e-06, + "loss": 0.0881, + "step": 45290 + }, + { + "epoch": 4.43, + "learning_rate": 4.8616108497093825e-06, + "loss": 0.1168, + "step": 45295 + }, + { + "epoch": 4.43, + "learning_rate": 4.857459175200664e-06, + "loss": 0.0964, + "step": 45300 + }, + { + "epoch": 4.43, + "learning_rate": 4.853307500691946e-06, + "loss": 0.0861, + "step": 45305 + }, + { + "epoch": 4.43, + "learning_rate": 4.849155826183227e-06, + "loss": 0.1244, + "step": 45310 + }, + { + "epoch": 4.43, + "learning_rate": 4.845004151674509e-06, + "loss": 0.0988, + "step": 45315 + }, + { + "epoch": 4.43, + "learning_rate": 4.840852477165791e-06, + "loss": 0.0877, + "step": 45320 + }, + { + "epoch": 4.43, + "learning_rate": 4.836700802657071e-06, + "loss": 0.0979, + "step": 45325 + }, + { + "epoch": 4.43, + "learning_rate": 4.832549128148354e-06, + "loss": 0.0953, + "step": 45330 + }, + { + "epoch": 4.43, + "learning_rate": 4.828397453639635e-06, + "loss": 0.0774, + "step": 45335 + }, + { + "epoch": 4.43, + "learning_rate": 4.824245779130917e-06, + "loss": 0.0932, + "step": 45340 + }, + { + "epoch": 4.43, + "learning_rate": 4.820094104622198e-06, + "loss": 0.1079, + "step": 45345 + }, + { + "epoch": 4.43, + "learning_rate": 4.815942430113479e-06, + "loss": 0.0844, + "step": 45350 + }, + { + "epoch": 4.43, + "learning_rate": 4.811790755604761e-06, + "loss": 0.0734, + "step": 45355 + }, + { + "epoch": 4.44, + "learning_rate": 4.807639081096042e-06, + "loss": 0.1054, + "step": 45360 + }, + { + "epoch": 4.44, + "learning_rate": 4.8034874065873234e-06, + "loss": 0.083, + "step": 45365 + }, + { + "epoch": 4.44, + "learning_rate": 4.799335732078605e-06, + "loss": 0.0948, + "step": 45370 + }, + { + "epoch": 4.44, + "learning_rate": 4.795184057569887e-06, + "loss": 0.1061, + "step": 45375 + }, + { + "epoch": 4.44, + "learning_rate": 4.791032383061168e-06, + "loss": 0.0995, + "step": 45380 + }, + { + "epoch": 4.44, + "learning_rate": 4.78688070855245e-06, + "loss": 0.0821, + "step": 45385 + }, + { + "epoch": 4.44, + "learning_rate": 4.782729034043731e-06, + "loss": 0.0836, + "step": 45390 + }, + { + "epoch": 4.44, + "learning_rate": 4.778577359535013e-06, + "loss": 0.103, + "step": 45395 + }, + { + "epoch": 4.44, + "learning_rate": 4.774425685026294e-06, + "loss": 0.0935, + "step": 45400 + }, + { + "epoch": 4.44, + "learning_rate": 4.7702740105175755e-06, + "loss": 0.0862, + "step": 45405 + }, + { + "epoch": 4.44, + "learning_rate": 4.766122336008857e-06, + "loss": 0.1059, + "step": 45410 + }, + { + "epoch": 4.44, + "learning_rate": 4.761970661500138e-06, + "loss": 0.0969, + "step": 45415 + }, + { + "epoch": 4.44, + "learning_rate": 4.75781898699142e-06, + "loss": 0.0976, + "step": 45420 + }, + { + "epoch": 4.44, + "learning_rate": 4.753667312482701e-06, + "loss": 0.107, + "step": 45425 + }, + { + "epoch": 4.44, + "learning_rate": 4.749515637973984e-06, + "loss": 0.0951, + "step": 45430 + }, + { + "epoch": 4.44, + "learning_rate": 4.745363963465264e-06, + "loss": 0.0912, + "step": 45435 + }, + { + "epoch": 4.44, + "learning_rate": 4.741212288956546e-06, + "loss": 0.0929, + "step": 45440 + }, + { + "epoch": 4.44, + "learning_rate": 4.737060614447828e-06, + "loss": 0.1063, + "step": 45445 + }, + { + "epoch": 4.44, + "learning_rate": 4.732908939939109e-06, + "loss": 0.0979, + "step": 45450 + }, + { + "epoch": 4.44, + "learning_rate": 4.72875726543039e-06, + "loss": 0.0759, + "step": 45455 + }, + { + "epoch": 4.45, + "learning_rate": 4.724605590921672e-06, + "loss": 0.1056, + "step": 45460 + }, + { + "epoch": 4.45, + "learning_rate": 4.720453916412953e-06, + "loss": 0.0812, + "step": 45465 + }, + { + "epoch": 4.45, + "learning_rate": 4.716302241904235e-06, + "loss": 0.0874, + "step": 45470 + }, + { + "epoch": 4.45, + "learning_rate": 4.7121505673955164e-06, + "loss": 0.1039, + "step": 45475 + }, + { + "epoch": 4.45, + "learning_rate": 4.707998892886797e-06, + "loss": 0.0996, + "step": 45480 + }, + { + "epoch": 4.45, + "learning_rate": 4.70384721837808e-06, + "loss": 0.0689, + "step": 45485 + }, + { + "epoch": 4.45, + "learning_rate": 4.6996955438693604e-06, + "loss": 0.0942, + "step": 45490 + }, + { + "epoch": 4.45, + "learning_rate": 4.695543869360643e-06, + "loss": 0.1149, + "step": 45495 + }, + { + "epoch": 4.45, + "learning_rate": 4.691392194851924e-06, + "loss": 0.0917, + "step": 45500 + }, + { + "epoch": 4.45, + "eval_cer": 0.053514570919206146, + "eval_loss": 0.22113968431949615, + "eval_runtime": 276.2739, + "eval_samples_per_second": 59.253, + "eval_steps_per_second": 1.647, + "eval_wer": 0.13710714822094383, + "step": 45500 + }, + { + "epoch": 4.45, + "learning_rate": 4.687240520343205e-06, + "loss": 0.0815, + "step": 45505 + }, + { + "epoch": 4.45, + "learning_rate": 4.683088845834487e-06, + "loss": 0.1122, + "step": 45510 + }, + { + "epoch": 4.45, + "learning_rate": 4.678937171325768e-06, + "loss": 0.0914, + "step": 45515 + }, + { + "epoch": 4.45, + "learning_rate": 4.67478549681705e-06, + "loss": 0.0876, + "step": 45520 + }, + { + "epoch": 4.45, + "learning_rate": 4.670633822308331e-06, + "loss": 0.0953, + "step": 45525 + }, + { + "epoch": 4.45, + "learning_rate": 4.6664821477996125e-06, + "loss": 0.0954, + "step": 45530 + }, + { + "epoch": 4.45, + "learning_rate": 4.662330473290894e-06, + "loss": 0.0824, + "step": 45535 + }, + { + "epoch": 4.45, + "learning_rate": 4.658178798782176e-06, + "loss": 0.102, + "step": 45540 + }, + { + "epoch": 4.45, + "learning_rate": 4.654027124273457e-06, + "loss": 0.0958, + "step": 45545 + }, + { + "epoch": 4.45, + "learning_rate": 4.649875449764739e-06, + "loss": 0.0831, + "step": 45550 + }, + { + "epoch": 4.45, + "learning_rate": 4.64572377525602e-06, + "loss": 0.0929, + "step": 45555 + }, + { + "epoch": 4.46, + "learning_rate": 4.641572100747302e-06, + "loss": 0.1088, + "step": 45560 + }, + { + "epoch": 4.46, + "learning_rate": 4.637420426238583e-06, + "loss": 0.0934, + "step": 45565 + }, + { + "epoch": 4.46, + "learning_rate": 4.633268751729864e-06, + "loss": 0.0759, + "step": 45570 + }, + { + "epoch": 4.46, + "learning_rate": 4.629117077221146e-06, + "loss": 0.0948, + "step": 45575 + }, + { + "epoch": 4.46, + "learning_rate": 4.624965402712427e-06, + "loss": 0.1046, + "step": 45580 + }, + { + "epoch": 4.46, + "learning_rate": 4.6208137282037094e-06, + "loss": 0.0814, + "step": 45585 + }, + { + "epoch": 4.46, + "learning_rate": 4.61666205369499e-06, + "loss": 0.1007, + "step": 45590 + }, + { + "epoch": 4.46, + "learning_rate": 4.612510379186272e-06, + "loss": 0.0986, + "step": 45595 + }, + { + "epoch": 4.46, + "learning_rate": 4.6083587046775534e-06, + "loss": 0.0885, + "step": 45600 + }, + { + "epoch": 4.46, + "learning_rate": 4.604207030168835e-06, + "loss": 0.081, + "step": 45605 + }, + { + "epoch": 4.46, + "learning_rate": 4.600055355660117e-06, + "loss": 0.118, + "step": 45610 + }, + { + "epoch": 4.46, + "learning_rate": 4.595903681151398e-06, + "loss": 0.0811, + "step": 45615 + }, + { + "epoch": 4.46, + "learning_rate": 4.591752006642679e-06, + "loss": 0.0799, + "step": 45620 + }, + { + "epoch": 4.46, + "learning_rate": 4.587600332133961e-06, + "loss": 0.1149, + "step": 45625 + }, + { + "epoch": 4.46, + "learning_rate": 4.583448657625242e-06, + "loss": 0.0933, + "step": 45630 + }, + { + "epoch": 4.46, + "learning_rate": 4.579296983116524e-06, + "loss": 0.0745, + "step": 45635 + }, + { + "epoch": 4.46, + "learning_rate": 4.5751453086078055e-06, + "loss": 0.0888, + "step": 45640 + }, + { + "epoch": 4.46, + "learning_rate": 4.570993634099086e-06, + "loss": 0.1111, + "step": 45645 + }, + { + "epoch": 4.46, + "learning_rate": 4.566841959590369e-06, + "loss": 0.0826, + "step": 45650 + }, + { + "epoch": 4.46, + "learning_rate": 4.5626902850816495e-06, + "loss": 0.0786, + "step": 45655 + }, + { + "epoch": 4.46, + "learning_rate": 4.558538610572931e-06, + "loss": 0.106, + "step": 45660 + }, + { + "epoch": 4.47, + "learning_rate": 4.554386936064213e-06, + "loss": 0.0845, + "step": 45665 + }, + { + "epoch": 4.47, + "learning_rate": 4.550235261555494e-06, + "loss": 0.0854, + "step": 45670 + }, + { + "epoch": 4.47, + "learning_rate": 4.546083587046776e-06, + "loss": 0.0935, + "step": 45675 + }, + { + "epoch": 4.47, + "learning_rate": 4.541931912538057e-06, + "loss": 0.0991, + "step": 45680 + }, + { + "epoch": 4.47, + "learning_rate": 4.537780238029338e-06, + "loss": 0.088, + "step": 45685 + }, + { + "epoch": 4.47, + "learning_rate": 4.53362856352062e-06, + "loss": 0.1042, + "step": 45690 + }, + { + "epoch": 4.47, + "learning_rate": 4.5294768890119016e-06, + "loss": 0.1096, + "step": 45695 + }, + { + "epoch": 4.47, + "learning_rate": 4.525325214503183e-06, + "loss": 0.0844, + "step": 45700 + }, + { + "epoch": 4.47, + "learning_rate": 4.521173539994465e-06, + "loss": 0.0761, + "step": 45705 + }, + { + "epoch": 4.47, + "learning_rate": 4.5170218654857456e-06, + "loss": 0.1004, + "step": 45710 + }, + { + "epoch": 4.47, + "learning_rate": 4.512870190977028e-06, + "loss": 0.0837, + "step": 45715 + }, + { + "epoch": 4.47, + "learning_rate": 4.508718516468309e-06, + "loss": 0.068, + "step": 45720 + }, + { + "epoch": 4.47, + "learning_rate": 4.504566841959591e-06, + "loss": 0.1005, + "step": 45725 + }, + { + "epoch": 4.47, + "learning_rate": 4.500415167450872e-06, + "loss": 0.1061, + "step": 45730 + }, + { + "epoch": 4.47, + "learning_rate": 4.496263492942153e-06, + "loss": 0.0744, + "step": 45735 + }, + { + "epoch": 4.47, + "learning_rate": 4.492111818433435e-06, + "loss": 0.0936, + "step": 45740 + }, + { + "epoch": 4.47, + "learning_rate": 4.487960143924716e-06, + "loss": 0.1082, + "step": 45745 + }, + { + "epoch": 4.47, + "learning_rate": 4.4838084694159985e-06, + "loss": 0.0775, + "step": 45750 + }, + { + "epoch": 4.47, + "learning_rate": 4.479656794907279e-06, + "loss": 0.0889, + "step": 45755 + }, + { + "epoch": 4.47, + "learning_rate": 4.475505120398561e-06, + "loss": 0.1122, + "step": 45760 + }, + { + "epoch": 4.48, + "learning_rate": 4.4713534458898425e-06, + "loss": 0.0892, + "step": 45765 + }, + { + "epoch": 4.48, + "learning_rate": 4.467201771381124e-06, + "loss": 0.0882, + "step": 45770 + }, + { + "epoch": 4.48, + "learning_rate": 4.463050096872405e-06, + "loss": 0.0932, + "step": 45775 + }, + { + "epoch": 4.48, + "learning_rate": 4.4588984223636865e-06, + "loss": 0.0855, + "step": 45780 + }, + { + "epoch": 4.48, + "learning_rate": 4.454746747854968e-06, + "loss": 0.089, + "step": 45785 + }, + { + "epoch": 4.48, + "learning_rate": 4.45059507334625e-06, + "loss": 0.0785, + "step": 45790 + }, + { + "epoch": 4.48, + "learning_rate": 4.446443398837531e-06, + "loss": 0.0991, + "step": 45795 + }, + { + "epoch": 4.48, + "learning_rate": 4.442291724328812e-06, + "loss": 0.0819, + "step": 45800 + }, + { + "epoch": 4.48, + "learning_rate": 4.4381400498200946e-06, + "loss": 0.0797, + "step": 45805 + }, + { + "epoch": 4.48, + "learning_rate": 4.433988375311375e-06, + "loss": 0.1123, + "step": 45810 + }, + { + "epoch": 4.48, + "learning_rate": 4.429836700802658e-06, + "loss": 0.0877, + "step": 45815 + }, + { + "epoch": 4.48, + "learning_rate": 4.4256850262939386e-06, + "loss": 0.0928, + "step": 45820 + }, + { + "epoch": 4.48, + "learning_rate": 4.42153335178522e-06, + "loss": 0.1027, + "step": 45825 + }, + { + "epoch": 4.48, + "learning_rate": 4.417381677276502e-06, + "loss": 0.0988, + "step": 45830 + }, + { + "epoch": 4.48, + "learning_rate": 4.4132300027677826e-06, + "loss": 0.092, + "step": 45835 + }, + { + "epoch": 4.48, + "learning_rate": 4.409078328259065e-06, + "loss": 0.0828, + "step": 45840 + }, + { + "epoch": 4.48, + "learning_rate": 4.404926653750346e-06, + "loss": 0.1103, + "step": 45845 + }, + { + "epoch": 4.48, + "learning_rate": 4.400774979241627e-06, + "loss": 0.0975, + "step": 45850 + }, + { + "epoch": 4.48, + "learning_rate": 4.396623304732909e-06, + "loss": 0.0749, + "step": 45855 + }, + { + "epoch": 4.48, + "learning_rate": 4.392471630224191e-06, + "loss": 0.1204, + "step": 45860 + }, + { + "epoch": 4.48, + "learning_rate": 4.388319955715472e-06, + "loss": 0.0998, + "step": 45865 + }, + { + "epoch": 4.49, + "learning_rate": 4.384168281206754e-06, + "loss": 0.0808, + "step": 45870 + }, + { + "epoch": 4.49, + "learning_rate": 4.380016606698035e-06, + "loss": 0.096, + "step": 45875 + }, + { + "epoch": 4.49, + "learning_rate": 4.375864932189317e-06, + "loss": 0.0805, + "step": 45880 + }, + { + "epoch": 4.49, + "learning_rate": 4.371713257680598e-06, + "loss": 0.0819, + "step": 45885 + }, + { + "epoch": 4.49, + "learning_rate": 4.367561583171879e-06, + "loss": 0.0902, + "step": 45890 + }, + { + "epoch": 4.49, + "learning_rate": 4.363409908663161e-06, + "loss": 0.102, + "step": 45895 + }, + { + "epoch": 4.49, + "learning_rate": 4.359258234154442e-06, + "loss": 0.0882, + "step": 45900 + }, + { + "epoch": 4.49, + "learning_rate": 4.355106559645724e-06, + "loss": 0.0767, + "step": 45905 + }, + { + "epoch": 4.49, + "learning_rate": 4.350954885137005e-06, + "loss": 0.1038, + "step": 45910 + }, + { + "epoch": 4.49, + "learning_rate": 4.346803210628287e-06, + "loss": 0.0929, + "step": 45915 + }, + { + "epoch": 4.49, + "learning_rate": 4.342651536119568e-06, + "loss": 0.0749, + "step": 45920 + }, + { + "epoch": 4.49, + "learning_rate": 4.33849986161085e-06, + "loss": 0.1068, + "step": 45925 + }, + { + "epoch": 4.49, + "learning_rate": 4.3343481871021316e-06, + "loss": 0.0923, + "step": 45930 + }, + { + "epoch": 4.49, + "learning_rate": 4.330196512593413e-06, + "loss": 0.0753, + "step": 45935 + }, + { + "epoch": 4.49, + "learning_rate": 4.326044838084694e-06, + "loss": 0.0713, + "step": 45940 + }, + { + "epoch": 4.49, + "learning_rate": 4.3218931635759756e-06, + "loss": 0.1034, + "step": 45945 + }, + { + "epoch": 4.49, + "learning_rate": 4.317741489067257e-06, + "loss": 0.0882, + "step": 45950 + }, + { + "epoch": 4.49, + "learning_rate": 4.313589814558539e-06, + "loss": 0.1017, + "step": 45955 + }, + { + "epoch": 4.49, + "learning_rate": 4.30943814004982e-06, + "loss": 0.1004, + "step": 45960 + }, + { + "epoch": 4.49, + "learning_rate": 4.305286465541101e-06, + "loss": 0.0925, + "step": 45965 + }, + { + "epoch": 4.5, + "learning_rate": 4.301134791032384e-06, + "loss": 0.0921, + "step": 45970 + }, + { + "epoch": 4.5, + "learning_rate": 4.296983116523664e-06, + "loss": 0.1119, + "step": 45975 + }, + { + "epoch": 4.5, + "learning_rate": 4.292831442014946e-06, + "loss": 0.0968, + "step": 45980 + }, + { + "epoch": 4.5, + "learning_rate": 4.288679767506228e-06, + "loss": 0.0805, + "step": 45985 + }, + { + "epoch": 4.5, + "learning_rate": 4.284528092997509e-06, + "loss": 0.074, + "step": 45990 + }, + { + "epoch": 4.5, + "learning_rate": 4.280376418488791e-06, + "loss": 0.1009, + "step": 45995 + }, + { + "epoch": 4.5, + "learning_rate": 4.276224743980072e-06, + "loss": 0.0736, + "step": 46000 + }, + { + "epoch": 4.5, + "eval_cer": 0.053402424671249636, + "eval_loss": 0.22255557775497437, + "eval_runtime": 274.5397, + "eval_samples_per_second": 59.627, + "eval_steps_per_second": 1.657, + "eval_wer": 0.13644110406613427, + "step": 46000 + }, + { + "epoch": 4.5, + "learning_rate": 4.272073069471353e-06, + "loss": 0.0966, + "step": 46005 + }, + { + "epoch": 4.5, + "learning_rate": 4.267921394962635e-06, + "loss": 0.1104, + "step": 46010 + }, + { + "epoch": 4.5, + "learning_rate": 4.2637697204539165e-06, + "loss": 0.0814, + "step": 46015 + }, + { + "epoch": 4.5, + "learning_rate": 4.259618045945198e-06, + "loss": 0.0827, + "step": 46020 + }, + { + "epoch": 4.5, + "learning_rate": 4.25546637143648e-06, + "loss": 0.1083, + "step": 46025 + }, + { + "epoch": 4.5, + "learning_rate": 4.2513146969277605e-06, + "loss": 0.0902, + "step": 46030 + }, + { + "epoch": 4.5, + "learning_rate": 4.247163022419043e-06, + "loss": 0.0861, + "step": 46035 + }, + { + "epoch": 4.5, + "learning_rate": 4.243011347910324e-06, + "loss": 0.0752, + "step": 46040 + }, + { + "epoch": 4.5, + "learning_rate": 4.238859673401606e-06, + "loss": 0.1145, + "step": 46045 + }, + { + "epoch": 4.5, + "learning_rate": 4.234707998892887e-06, + "loss": 0.088, + "step": 46050 + }, + { + "epoch": 4.5, + "learning_rate": 4.230556324384168e-06, + "loss": 0.0733, + "step": 46055 + }, + { + "epoch": 4.5, + "learning_rate": 4.22640464987545e-06, + "loss": 0.1079, + "step": 46060 + }, + { + "epoch": 4.5, + "learning_rate": 4.222252975366731e-06, + "loss": 0.1036, + "step": 46065 + }, + { + "epoch": 4.5, + "learning_rate": 4.2181013008580126e-06, + "loss": 0.088, + "step": 46070 + }, + { + "epoch": 4.51, + "learning_rate": 4.213949626349294e-06, + "loss": 0.0997, + "step": 46075 + }, + { + "epoch": 4.51, + "learning_rate": 4.209797951840576e-06, + "loss": 0.0906, + "step": 46080 + }, + { + "epoch": 4.51, + "learning_rate": 4.205646277331857e-06, + "loss": 0.0967, + "step": 46085 + }, + { + "epoch": 4.51, + "learning_rate": 4.201494602823139e-06, + "loss": 0.09, + "step": 46090 + }, + { + "epoch": 4.51, + "learning_rate": 4.19734292831442e-06, + "loss": 0.0981, + "step": 46095 + }, + { + "epoch": 4.51, + "learning_rate": 4.193191253805702e-06, + "loss": 0.0885, + "step": 46100 + }, + { + "epoch": 4.51, + "learning_rate": 4.189039579296983e-06, + "loss": 0.0833, + "step": 46105 + }, + { + "epoch": 4.51, + "learning_rate": 4.184887904788265e-06, + "loss": 0.098, + "step": 46110 + }, + { + "epoch": 4.51, + "learning_rate": 4.180736230279546e-06, + "loss": 0.0883, + "step": 46115 + }, + { + "epoch": 4.51, + "learning_rate": 4.176584555770827e-06, + "loss": 0.0748, + "step": 46120 + }, + { + "epoch": 4.51, + "learning_rate": 4.1724328812621095e-06, + "loss": 0.105, + "step": 46125 + }, + { + "epoch": 4.51, + "learning_rate": 4.16828120675339e-06, + "loss": 0.0963, + "step": 46130 + }, + { + "epoch": 4.51, + "learning_rate": 4.164129532244673e-06, + "loss": 0.0864, + "step": 46135 + }, + { + "epoch": 4.51, + "learning_rate": 4.1599778577359535e-06, + "loss": 0.0806, + "step": 46140 + }, + { + "epoch": 4.51, + "learning_rate": 4.155826183227235e-06, + "loss": 0.1043, + "step": 46145 + }, + { + "epoch": 4.51, + "learning_rate": 4.151674508718517e-06, + "loss": 0.0807, + "step": 46150 + }, + { + "epoch": 4.51, + "learning_rate": 4.147522834209798e-06, + "loss": 0.0767, + "step": 46155 + }, + { + "epoch": 4.51, + "learning_rate": 4.14337115970108e-06, + "loss": 0.1161, + "step": 46160 + }, + { + "epoch": 4.51, + "learning_rate": 4.139219485192361e-06, + "loss": 0.0987, + "step": 46165 + }, + { + "epoch": 4.51, + "learning_rate": 4.135067810683642e-06, + "loss": 0.0785, + "step": 46170 + }, + { + "epoch": 4.52, + "learning_rate": 4.130916136174924e-06, + "loss": 0.1063, + "step": 46175 + }, + { + "epoch": 4.52, + "learning_rate": 4.1267644616662056e-06, + "loss": 0.0998, + "step": 46180 + }, + { + "epoch": 4.52, + "learning_rate": 4.122612787157486e-06, + "loss": 0.079, + "step": 46185 + }, + { + "epoch": 4.52, + "learning_rate": 4.118461112648769e-06, + "loss": 0.0827, + "step": 46190 + }, + { + "epoch": 4.52, + "learning_rate": 4.1143094381400496e-06, + "loss": 0.1188, + "step": 46195 + }, + { + "epoch": 4.52, + "learning_rate": 4.110157763631332e-06, + "loss": 0.0824, + "step": 46200 + }, + { + "epoch": 4.52, + "learning_rate": 4.106006089122613e-06, + "loss": 0.0823, + "step": 46205 + }, + { + "epoch": 4.52, + "learning_rate": 4.101854414613894e-06, + "loss": 0.111, + "step": 46210 + }, + { + "epoch": 4.52, + "learning_rate": 4.097702740105176e-06, + "loss": 0.0829, + "step": 46215 + }, + { + "epoch": 4.52, + "learning_rate": 4.093551065596457e-06, + "loss": 0.0778, + "step": 46220 + }, + { + "epoch": 4.52, + "learning_rate": 4.089399391087739e-06, + "loss": 0.0917, + "step": 46225 + }, + { + "epoch": 4.52, + "learning_rate": 4.08524771657902e-06, + "loss": 0.0946, + "step": 46230 + }, + { + "epoch": 4.52, + "learning_rate": 4.081096042070302e-06, + "loss": 0.0843, + "step": 46235 + }, + { + "epoch": 4.52, + "learning_rate": 4.076944367561583e-06, + "loss": 0.0919, + "step": 46240 + }, + { + "epoch": 4.52, + "learning_rate": 4.072792693052865e-06, + "loss": 0.091, + "step": 46245 + }, + { + "epoch": 4.52, + "learning_rate": 4.0686410185441465e-06, + "loss": 0.091, + "step": 46250 + }, + { + "epoch": 4.52, + "learning_rate": 4.064489344035428e-06, + "loss": 0.0875, + "step": 46255 + }, + { + "epoch": 4.52, + "learning_rate": 4.060337669526709e-06, + "loss": 0.1163, + "step": 46260 + }, + { + "epoch": 4.52, + "learning_rate": 4.056185995017991e-06, + "loss": 0.0894, + "step": 46265 + }, + { + "epoch": 4.52, + "learning_rate": 4.052034320509272e-06, + "loss": 0.084, + "step": 46270 + }, + { + "epoch": 4.52, + "learning_rate": 4.047882646000554e-06, + "loss": 0.0926, + "step": 46275 + }, + { + "epoch": 4.53, + "learning_rate": 4.043730971491835e-06, + "loss": 0.1003, + "step": 46280 + }, + { + "epoch": 4.53, + "learning_rate": 4.039579296983116e-06, + "loss": 0.0781, + "step": 46285 + }, + { + "epoch": 4.53, + "learning_rate": 4.0354276224743986e-06, + "loss": 0.0922, + "step": 46290 + }, + { + "epoch": 4.53, + "learning_rate": 4.031275947965679e-06, + "loss": 0.1045, + "step": 46295 + }, + { + "epoch": 4.53, + "learning_rate": 4.027124273456961e-06, + "loss": 0.0817, + "step": 46300 + }, + { + "epoch": 4.53, + "learning_rate": 4.0229725989482426e-06, + "loss": 0.0709, + "step": 46305 + }, + { + "epoch": 4.53, + "learning_rate": 4.018820924439524e-06, + "loss": 0.1163, + "step": 46310 + }, + { + "epoch": 4.53, + "learning_rate": 4.014669249930806e-06, + "loss": 0.0903, + "step": 46315 + }, + { + "epoch": 4.53, + "learning_rate": 4.010517575422087e-06, + "loss": 0.0871, + "step": 46320 + }, + { + "epoch": 4.53, + "learning_rate": 4.006365900913368e-06, + "loss": 0.0876, + "step": 46325 + }, + { + "epoch": 4.53, + "learning_rate": 4.00221422640465e-06, + "loss": 0.0883, + "step": 46330 + }, + { + "epoch": 4.53, + "learning_rate": 3.998062551895931e-06, + "loss": 0.0826, + "step": 46335 + }, + { + "epoch": 4.53, + "learning_rate": 3.993910877387213e-06, + "loss": 0.0825, + "step": 46340 + }, + { + "epoch": 4.53, + "learning_rate": 3.989759202878495e-06, + "loss": 0.0853, + "step": 46345 + }, + { + "epoch": 4.53, + "learning_rate": 3.985607528369775e-06, + "loss": 0.0841, + "step": 46350 + }, + { + "epoch": 4.53, + "learning_rate": 3.981455853861058e-06, + "loss": 0.0847, + "step": 46355 + }, + { + "epoch": 4.53, + "learning_rate": 3.977304179352339e-06, + "loss": 0.1044, + "step": 46360 + }, + { + "epoch": 4.53, + "learning_rate": 3.973152504843621e-06, + "loss": 0.0887, + "step": 46365 + }, + { + "epoch": 4.53, + "learning_rate": 3.969000830334902e-06, + "loss": 0.0825, + "step": 46370 + }, + { + "epoch": 4.53, + "learning_rate": 3.9648491558261835e-06, + "loss": 0.1213, + "step": 46375 + }, + { + "epoch": 4.54, + "learning_rate": 3.960697481317465e-06, + "loss": 0.0849, + "step": 46380 + }, + { + "epoch": 4.54, + "learning_rate": 3.956545806808746e-06, + "loss": 0.0899, + "step": 46385 + }, + { + "epoch": 4.54, + "learning_rate": 3.9523941323000275e-06, + "loss": 0.0886, + "step": 46390 + }, + { + "epoch": 4.54, + "learning_rate": 3.948242457791309e-06, + "loss": 0.1151, + "step": 46395 + }, + { + "epoch": 4.54, + "learning_rate": 3.944090783282591e-06, + "loss": 0.0842, + "step": 46400 + }, + { + "epoch": 4.54, + "learning_rate": 3.939939108773872e-06, + "loss": 0.0909, + "step": 46405 + }, + { + "epoch": 4.54, + "learning_rate": 3.935787434265154e-06, + "loss": 0.1053, + "step": 46410 + }, + { + "epoch": 4.54, + "learning_rate": 3.931635759756435e-06, + "loss": 0.0958, + "step": 46415 + }, + { + "epoch": 4.54, + "learning_rate": 3.927484085247717e-06, + "loss": 0.0797, + "step": 46420 + }, + { + "epoch": 4.54, + "learning_rate": 3.923332410738998e-06, + "loss": 0.0952, + "step": 46425 + }, + { + "epoch": 4.54, + "learning_rate": 3.91918073623028e-06, + "loss": 0.0942, + "step": 46430 + }, + { + "epoch": 4.54, + "learning_rate": 3.915029061721561e-06, + "loss": 0.0836, + "step": 46435 + }, + { + "epoch": 4.54, + "learning_rate": 3.910877387212842e-06, + "loss": 0.0972, + "step": 46440 + }, + { + "epoch": 4.54, + "learning_rate": 3.906725712704124e-06, + "loss": 0.0958, + "step": 46445 + }, + { + "epoch": 4.54, + "learning_rate": 3.902574038195405e-06, + "loss": 0.0758, + "step": 46450 + }, + { + "epoch": 4.54, + "learning_rate": 3.898422363686688e-06, + "loss": 0.0836, + "step": 46455 + }, + { + "epoch": 4.54, + "learning_rate": 3.894270689177968e-06, + "loss": 0.1016, + "step": 46460 + }, + { + "epoch": 4.54, + "learning_rate": 3.89011901466925e-06, + "loss": 0.0958, + "step": 46465 + }, + { + "epoch": 4.54, + "learning_rate": 3.885967340160532e-06, + "loss": 0.0845, + "step": 46470 + }, + { + "epoch": 4.54, + "learning_rate": 3.881815665651813e-06, + "loss": 0.1, + "step": 46475 + }, + { + "epoch": 4.54, + "learning_rate": 3.877663991143095e-06, + "loss": 0.0923, + "step": 46480 + }, + { + "epoch": 4.55, + "learning_rate": 3.873512316634376e-06, + "loss": 0.0852, + "step": 46485 + }, + { + "epoch": 4.55, + "learning_rate": 3.869360642125657e-06, + "loss": 0.0726, + "step": 46490 + }, + { + "epoch": 4.55, + "learning_rate": 3.865208967616939e-06, + "loss": 0.1082, + "step": 46495 + }, + { + "epoch": 4.55, + "learning_rate": 3.8610572931082205e-06, + "loss": 0.0728, + "step": 46500 + }, + { + "epoch": 4.55, + "eval_cer": 0.0530613613398355, + "eval_loss": 0.22180874645709991, + "eval_runtime": 278.1081, + "eval_samples_per_second": 58.862, + "eval_steps_per_second": 1.636, + "eval_wer": 0.1358077091345997, + "step": 46500 + }, + { + "epoch": 4.55, + "learning_rate": 3.856905618599501e-06, + "loss": 0.082, + "step": 46505 + }, + { + "epoch": 4.55, + "learning_rate": 3.852753944090784e-06, + "loss": 0.1224, + "step": 46510 + }, + { + "epoch": 4.55, + "learning_rate": 3.8486022695820645e-06, + "loss": 0.0844, + "step": 46515 + }, + { + "epoch": 4.55, + "learning_rate": 3.844450595073347e-06, + "loss": 0.0881, + "step": 46520 + }, + { + "epoch": 4.55, + "learning_rate": 3.840298920564628e-06, + "loss": 0.0832, + "step": 46525 + }, + { + "epoch": 4.55, + "learning_rate": 3.836147246055909e-06, + "loss": 0.1005, + "step": 46530 + }, + { + "epoch": 4.55, + "learning_rate": 3.831995571547191e-06, + "loss": 0.0815, + "step": 46535 + }, + { + "epoch": 4.55, + "learning_rate": 3.827843897038472e-06, + "loss": 0.0985, + "step": 46540 + }, + { + "epoch": 4.55, + "learning_rate": 3.823692222529754e-06, + "loss": 0.1014, + "step": 46545 + }, + { + "epoch": 4.55, + "learning_rate": 3.819540548021035e-06, + "loss": 0.0968, + "step": 46550 + }, + { + "epoch": 4.55, + "learning_rate": 3.8153888735123166e-06, + "loss": 0.0819, + "step": 46555 + }, + { + "epoch": 4.55, + "learning_rate": 3.8112371990035977e-06, + "loss": 0.1027, + "step": 46560 + }, + { + "epoch": 4.55, + "learning_rate": 3.80708552449488e-06, + "loss": 0.0844, + "step": 46565 + }, + { + "epoch": 4.55, + "learning_rate": 3.802933849986161e-06, + "loss": 0.0862, + "step": 46570 + }, + { + "epoch": 4.55, + "learning_rate": 3.798782175477443e-06, + "loss": 0.0992, + "step": 46575 + }, + { + "epoch": 4.55, + "learning_rate": 3.794630500968724e-06, + "loss": 0.0888, + "step": 46580 + }, + { + "epoch": 4.56, + "learning_rate": 3.790478826460006e-06, + "loss": 0.0829, + "step": 46585 + }, + { + "epoch": 4.56, + "learning_rate": 3.786327151951287e-06, + "loss": 0.0909, + "step": 46590 + }, + { + "epoch": 4.56, + "learning_rate": 3.782175477442568e-06, + "loss": 0.107, + "step": 46595 + }, + { + "epoch": 4.56, + "learning_rate": 3.7780238029338502e-06, + "loss": 0.0948, + "step": 46600 + }, + { + "epoch": 4.56, + "learning_rate": 3.7738721284251314e-06, + "loss": 0.0794, + "step": 46605 + }, + { + "epoch": 4.56, + "learning_rate": 3.769720453916413e-06, + "loss": 0.1088, + "step": 46610 + }, + { + "epoch": 4.56, + "learning_rate": 3.7655687794076942e-06, + "loss": 0.0905, + "step": 46615 + }, + { + "epoch": 4.56, + "learning_rate": 3.7614171048989763e-06, + "loss": 0.0745, + "step": 46620 + }, + { + "epoch": 4.56, + "learning_rate": 3.7572654303902575e-06, + "loss": 0.1005, + "step": 46625 + }, + { + "epoch": 4.56, + "learning_rate": 3.753113755881539e-06, + "loss": 0.0921, + "step": 46630 + }, + { + "epoch": 4.56, + "learning_rate": 3.7489620813728203e-06, + "loss": 0.0738, + "step": 46635 + }, + { + "epoch": 4.56, + "learning_rate": 3.744810406864102e-06, + "loss": 0.0772, + "step": 46640 + }, + { + "epoch": 4.56, + "learning_rate": 3.7406587323553835e-06, + "loss": 0.093, + "step": 46645 + }, + { + "epoch": 4.56, + "learning_rate": 3.736507057846665e-06, + "loss": 0.0903, + "step": 46650 + }, + { + "epoch": 4.56, + "learning_rate": 3.7323553833379463e-06, + "loss": 0.0767, + "step": 46655 + }, + { + "epoch": 4.56, + "learning_rate": 3.728203708829228e-06, + "loss": 0.1072, + "step": 46660 + }, + { + "epoch": 4.56, + "learning_rate": 3.7240520343205096e-06, + "loss": 0.0919, + "step": 46665 + }, + { + "epoch": 4.56, + "learning_rate": 3.719900359811791e-06, + "loss": 0.0723, + "step": 46670 + }, + { + "epoch": 4.56, + "learning_rate": 3.715748685303072e-06, + "loss": 0.1074, + "step": 46675 + }, + { + "epoch": 4.56, + "learning_rate": 3.7115970107943536e-06, + "loss": 0.0989, + "step": 46680 + }, + { + "epoch": 4.57, + "learning_rate": 3.707445336285635e-06, + "loss": 0.0822, + "step": 46685 + }, + { + "epoch": 4.57, + "learning_rate": 3.7032936617769168e-06, + "loss": 0.0763, + "step": 46690 + }, + { + "epoch": 4.57, + "learning_rate": 3.6991419872681984e-06, + "loss": 0.1, + "step": 46695 + }, + { + "epoch": 4.57, + "learning_rate": 3.6949903127594796e-06, + "loss": 0.085, + "step": 46700 + }, + { + "epoch": 4.57, + "learning_rate": 3.690838638250761e-06, + "loss": 0.0749, + "step": 46705 + }, + { + "epoch": 4.57, + "learning_rate": 3.686686963742043e-06, + "loss": 0.0979, + "step": 46710 + }, + { + "epoch": 4.57, + "learning_rate": 3.6825352892333244e-06, + "loss": 0.09, + "step": 46715 + }, + { + "epoch": 4.57, + "learning_rate": 3.6783836147246056e-06, + "loss": 0.0772, + "step": 46720 + }, + { + "epoch": 4.57, + "learning_rate": 3.6742319402158872e-06, + "loss": 0.0924, + "step": 46725 + }, + { + "epoch": 4.57, + "learning_rate": 3.6700802657071684e-06, + "loss": 0.0993, + "step": 46730 + }, + { + "epoch": 4.57, + "learning_rate": 3.66592859119845e-06, + "loss": 0.0893, + "step": 46735 + }, + { + "epoch": 4.57, + "learning_rate": 3.6617769166897317e-06, + "loss": 0.0781, + "step": 46740 + }, + { + "epoch": 4.57, + "learning_rate": 3.657625242181013e-06, + "loss": 0.1167, + "step": 46745 + }, + { + "epoch": 4.57, + "learning_rate": 3.6534735676722945e-06, + "loss": 0.0906, + "step": 46750 + }, + { + "epoch": 4.57, + "learning_rate": 3.649321893163576e-06, + "loss": 0.0836, + "step": 46755 + }, + { + "epoch": 4.57, + "learning_rate": 3.6451702186548577e-06, + "loss": 0.0999, + "step": 46760 + }, + { + "epoch": 4.57, + "learning_rate": 3.641018544146139e-06, + "loss": 0.0848, + "step": 46765 + }, + { + "epoch": 4.57, + "learning_rate": 3.6368668696374205e-06, + "loss": 0.0889, + "step": 46770 + }, + { + "epoch": 4.57, + "learning_rate": 3.632715195128702e-06, + "loss": 0.0962, + "step": 46775 + }, + { + "epoch": 4.57, + "learning_rate": 3.6285635206199837e-06, + "loss": 0.0839, + "step": 46780 + }, + { + "epoch": 4.57, + "learning_rate": 3.624411846111265e-06, + "loss": 0.0812, + "step": 46785 + }, + { + "epoch": 4.58, + "learning_rate": 3.620260171602546e-06, + "loss": 0.0881, + "step": 46790 + }, + { + "epoch": 4.58, + "learning_rate": 3.6161084970938277e-06, + "loss": 0.099, + "step": 46795 + }, + { + "epoch": 4.58, + "learning_rate": 3.6119568225851094e-06, + "loss": 0.0852, + "step": 46800 + }, + { + "epoch": 4.58, + "learning_rate": 3.607805148076391e-06, + "loss": 0.0788, + "step": 46805 + }, + { + "epoch": 4.58, + "learning_rate": 3.6036534735676726e-06, + "loss": 0.105, + "step": 46810 + }, + { + "epoch": 4.58, + "learning_rate": 3.5995017990589538e-06, + "loss": 0.0905, + "step": 46815 + }, + { + "epoch": 4.58, + "learning_rate": 3.5953501245502354e-06, + "loss": 0.0666, + "step": 46820 + }, + { + "epoch": 4.58, + "learning_rate": 3.591198450041517e-06, + "loss": 0.1239, + "step": 46825 + }, + { + "epoch": 4.58, + "learning_rate": 3.5870467755327986e-06, + "loss": 0.0947, + "step": 46830 + }, + { + "epoch": 4.58, + "learning_rate": 3.58289510102408e-06, + "loss": 0.0866, + "step": 46835 + }, + { + "epoch": 4.58, + "learning_rate": 3.578743426515361e-06, + "loss": 0.0948, + "step": 46840 + }, + { + "epoch": 4.58, + "learning_rate": 3.5745917520066426e-06, + "loss": 0.0931, + "step": 46845 + }, + { + "epoch": 4.58, + "learning_rate": 3.5704400774979242e-06, + "loss": 0.0841, + "step": 46850 + }, + { + "epoch": 4.58, + "learning_rate": 3.566288402989206e-06, + "loss": 0.0907, + "step": 46855 + }, + { + "epoch": 4.58, + "learning_rate": 3.562136728480487e-06, + "loss": 0.0949, + "step": 46860 + }, + { + "epoch": 4.58, + "learning_rate": 3.5579850539717687e-06, + "loss": 0.0993, + "step": 46865 + }, + { + "epoch": 4.58, + "learning_rate": 3.5538333794630503e-06, + "loss": 0.0878, + "step": 46870 + }, + { + "epoch": 4.58, + "learning_rate": 3.549681704954332e-06, + "loss": 0.0974, + "step": 46875 + }, + { + "epoch": 4.58, + "learning_rate": 3.545530030445613e-06, + "loss": 0.0929, + "step": 46880 + }, + { + "epoch": 4.58, + "learning_rate": 3.5413783559368947e-06, + "loss": 0.0964, + "step": 46885 + }, + { + "epoch": 4.59, + "learning_rate": 3.5372266814281763e-06, + "loss": 0.0868, + "step": 46890 + }, + { + "epoch": 4.59, + "learning_rate": 3.5330750069194575e-06, + "loss": 0.1067, + "step": 46895 + }, + { + "epoch": 4.59, + "learning_rate": 3.528923332410739e-06, + "loss": 0.0936, + "step": 46900 + }, + { + "epoch": 4.59, + "learning_rate": 3.5247716579020203e-06, + "loss": 0.0836, + "step": 46905 + }, + { + "epoch": 4.59, + "learning_rate": 3.520619983393302e-06, + "loss": 0.0984, + "step": 46910 + }, + { + "epoch": 4.59, + "learning_rate": 3.5164683088845836e-06, + "loss": 0.0872, + "step": 46915 + }, + { + "epoch": 4.59, + "learning_rate": 3.512316634375865e-06, + "loss": 0.0824, + "step": 46920 + }, + { + "epoch": 4.59, + "learning_rate": 3.5081649598671464e-06, + "loss": 0.097, + "step": 46925 + }, + { + "epoch": 4.59, + "learning_rate": 3.504013285358428e-06, + "loss": 0.0927, + "step": 46930 + }, + { + "epoch": 4.59, + "learning_rate": 3.4998616108497096e-06, + "loss": 0.0827, + "step": 46935 + }, + { + "epoch": 4.59, + "learning_rate": 3.495709936340991e-06, + "loss": 0.0819, + "step": 46940 + }, + { + "epoch": 4.59, + "learning_rate": 3.491558261832273e-06, + "loss": 0.0976, + "step": 46945 + }, + { + "epoch": 4.59, + "learning_rate": 3.4874065873235536e-06, + "loss": 0.0834, + "step": 46950 + }, + { + "epoch": 4.59, + "learning_rate": 3.483254912814835e-06, + "loss": 0.0892, + "step": 46955 + }, + { + "epoch": 4.59, + "learning_rate": 3.479103238306117e-06, + "loss": 0.1104, + "step": 46960 + }, + { + "epoch": 4.59, + "learning_rate": 3.4749515637973984e-06, + "loss": 0.0976, + "step": 46965 + }, + { + "epoch": 4.59, + "learning_rate": 3.4707998892886796e-06, + "loss": 0.0789, + "step": 46970 + }, + { + "epoch": 4.59, + "learning_rate": 3.4666482147799612e-06, + "loss": 0.0937, + "step": 46975 + }, + { + "epoch": 4.59, + "learning_rate": 3.462496540271243e-06, + "loss": 0.0974, + "step": 46980 + }, + { + "epoch": 4.59, + "learning_rate": 3.4583448657625245e-06, + "loss": 0.0714, + "step": 46985 + }, + { + "epoch": 4.59, + "learning_rate": 3.454193191253806e-06, + "loss": 0.0649, + "step": 46990 + }, + { + "epoch": 4.6, + "learning_rate": 3.4500415167450873e-06, + "loss": 0.0974, + "step": 46995 + }, + { + "epoch": 4.6, + "learning_rate": 3.4458898422363685e-06, + "loss": 0.0824, + "step": 47000 + }, + { + "epoch": 4.6, + "eval_cer": 0.05325675016359478, + "eval_loss": 0.22053982317447662, + "eval_runtime": 274.339, + "eval_samples_per_second": 59.671, + "eval_steps_per_second": 1.659, + "eval_wer": 0.13649334282337422, + "step": 47000 + }, + { + "epoch": 4.6, + "learning_rate": 3.44173816772765e-06, + "loss": 0.0805, + "step": 47005 + }, + { + "epoch": 4.6, + "learning_rate": 3.4375864932189317e-06, + "loss": 0.1105, + "step": 47010 + }, + { + "epoch": 4.6, + "learning_rate": 3.4334348187102133e-06, + "loss": 0.088, + "step": 47015 + }, + { + "epoch": 4.6, + "learning_rate": 3.4292831442014945e-06, + "loss": 0.0847, + "step": 47020 + }, + { + "epoch": 4.6, + "learning_rate": 3.425131469692776e-06, + "loss": 0.0846, + "step": 47025 + }, + { + "epoch": 4.6, + "learning_rate": 3.4209797951840577e-06, + "loss": 0.0888, + "step": 47030 + }, + { + "epoch": 4.6, + "learning_rate": 3.4168281206753394e-06, + "loss": 0.0866, + "step": 47035 + }, + { + "epoch": 4.6, + "learning_rate": 3.4126764461666205e-06, + "loss": 0.0873, + "step": 47040 + }, + { + "epoch": 4.6, + "learning_rate": 3.408524771657902e-06, + "loss": 0.1005, + "step": 47045 + }, + { + "epoch": 4.6, + "learning_rate": 3.4043730971491838e-06, + "loss": 0.0851, + "step": 47050 + }, + { + "epoch": 4.6, + "learning_rate": 3.400221422640465e-06, + "loss": 0.0836, + "step": 47055 + }, + { + "epoch": 4.6, + "learning_rate": 3.3960697481317466e-06, + "loss": 0.0944, + "step": 47060 + }, + { + "epoch": 4.6, + "learning_rate": 3.3919180736230278e-06, + "loss": 0.0772, + "step": 47065 + }, + { + "epoch": 4.6, + "learning_rate": 3.3877663991143094e-06, + "loss": 0.0883, + "step": 47070 + }, + { + "epoch": 4.6, + "learning_rate": 3.383614724605591e-06, + "loss": 0.0935, + "step": 47075 + }, + { + "epoch": 4.6, + "learning_rate": 3.3794630500968726e-06, + "loss": 0.0935, + "step": 47080 + }, + { + "epoch": 4.6, + "learning_rate": 3.375311375588154e-06, + "loss": 0.0785, + "step": 47085 + }, + { + "epoch": 4.6, + "learning_rate": 3.3711597010794354e-06, + "loss": 0.0918, + "step": 47090 + }, + { + "epoch": 4.61, + "learning_rate": 3.367008026570717e-06, + "loss": 0.1006, + "step": 47095 + }, + { + "epoch": 4.61, + "learning_rate": 3.3628563520619987e-06, + "loss": 0.0759, + "step": 47100 + }, + { + "epoch": 4.61, + "learning_rate": 3.3587046775532803e-06, + "loss": 0.0756, + "step": 47105 + }, + { + "epoch": 4.61, + "learning_rate": 3.354553003044561e-06, + "loss": 0.1034, + "step": 47110 + }, + { + "epoch": 4.61, + "learning_rate": 3.3504013285358427e-06, + "loss": 0.0916, + "step": 47115 + }, + { + "epoch": 4.61, + "learning_rate": 3.3462496540271243e-06, + "loss": 0.0909, + "step": 47120 + }, + { + "epoch": 4.61, + "learning_rate": 3.342097979518406e-06, + "loss": 0.0995, + "step": 47125 + }, + { + "epoch": 4.61, + "learning_rate": 3.337946305009687e-06, + "loss": 0.0872, + "step": 47130 + }, + { + "epoch": 4.61, + "learning_rate": 3.3337946305009687e-06, + "loss": 0.0808, + "step": 47135 + }, + { + "epoch": 4.61, + "learning_rate": 3.3296429559922503e-06, + "loss": 0.0802, + "step": 47140 + }, + { + "epoch": 4.61, + "learning_rate": 3.325491281483532e-06, + "loss": 0.0959, + "step": 47145 + }, + { + "epoch": 4.61, + "learning_rate": 3.3213396069748135e-06, + "loss": 0.0875, + "step": 47150 + }, + { + "epoch": 4.61, + "learning_rate": 3.3171879324660947e-06, + "loss": 0.0795, + "step": 47155 + }, + { + "epoch": 4.61, + "learning_rate": 3.3130362579573764e-06, + "loss": 0.0977, + "step": 47160 + }, + { + "epoch": 4.61, + "learning_rate": 3.3088845834486575e-06, + "loss": 0.0827, + "step": 47165 + }, + { + "epoch": 4.61, + "learning_rate": 3.304732908939939e-06, + "loss": 0.0862, + "step": 47170 + }, + { + "epoch": 4.61, + "learning_rate": 3.3005812344312204e-06, + "loss": 0.0821, + "step": 47175 + }, + { + "epoch": 4.61, + "learning_rate": 3.296429559922502e-06, + "loss": 0.0914, + "step": 47180 + }, + { + "epoch": 4.61, + "learning_rate": 3.2922778854137836e-06, + "loss": 0.0856, + "step": 47185 + }, + { + "epoch": 4.61, + "learning_rate": 3.288126210905065e-06, + "loss": 0.0784, + "step": 47190 + }, + { + "epoch": 4.61, + "learning_rate": 3.283974536396347e-06, + "loss": 0.0992, + "step": 47195 + }, + { + "epoch": 4.62, + "learning_rate": 3.279822861887628e-06, + "loss": 0.0825, + "step": 47200 + }, + { + "epoch": 4.62, + "learning_rate": 3.2756711873789096e-06, + "loss": 0.076, + "step": 47205 + }, + { + "epoch": 4.62, + "learning_rate": 3.2715195128701912e-06, + "loss": 0.1016, + "step": 47210 + }, + { + "epoch": 4.62, + "learning_rate": 3.267367838361473e-06, + "loss": 0.0917, + "step": 47215 + }, + { + "epoch": 4.62, + "learning_rate": 3.263216163852754e-06, + "loss": 0.0836, + "step": 47220 + }, + { + "epoch": 4.62, + "learning_rate": 3.2590644893440352e-06, + "loss": 0.1161, + "step": 47225 + }, + { + "epoch": 4.62, + "learning_rate": 3.254912814835317e-06, + "loss": 0.0961, + "step": 47230 + }, + { + "epoch": 4.62, + "learning_rate": 3.2507611403265985e-06, + "loss": 0.0833, + "step": 47235 + }, + { + "epoch": 4.62, + "learning_rate": 3.24660946581788e-06, + "loss": 0.0847, + "step": 47240 + }, + { + "epoch": 4.62, + "learning_rate": 3.2424577913091613e-06, + "loss": 0.1034, + "step": 47245 + }, + { + "epoch": 4.62, + "learning_rate": 3.238306116800443e-06, + "loss": 0.0718, + "step": 47250 + }, + { + "epoch": 4.62, + "learning_rate": 3.2341544422917245e-06, + "loss": 0.097, + "step": 47255 + }, + { + "epoch": 4.62, + "learning_rate": 3.230002767783006e-06, + "loss": 0.1, + "step": 47260 + }, + { + "epoch": 4.62, + "learning_rate": 3.2258510932742877e-06, + "loss": 0.082, + "step": 47265 + }, + { + "epoch": 4.62, + "learning_rate": 3.221699418765569e-06, + "loss": 0.0919, + "step": 47270 + }, + { + "epoch": 4.62, + "learning_rate": 3.21754774425685e-06, + "loss": 0.0844, + "step": 47275 + }, + { + "epoch": 4.62, + "learning_rate": 3.2133960697481317e-06, + "loss": 0.09, + "step": 47280 + }, + { + "epoch": 4.62, + "learning_rate": 3.2092443952394134e-06, + "loss": 0.0773, + "step": 47285 + }, + { + "epoch": 4.62, + "learning_rate": 3.2050927207306945e-06, + "loss": 0.1011, + "step": 47290 + }, + { + "epoch": 4.62, + "learning_rate": 3.200941046221976e-06, + "loss": 0.0984, + "step": 47295 + }, + { + "epoch": 4.63, + "learning_rate": 3.1967893717132578e-06, + "loss": 0.082, + "step": 47300 + }, + { + "epoch": 4.63, + "learning_rate": 3.1926376972045394e-06, + "loss": 0.0858, + "step": 47305 + }, + { + "epoch": 4.63, + "learning_rate": 3.188486022695821e-06, + "loss": 0.1036, + "step": 47310 + }, + { + "epoch": 4.63, + "learning_rate": 3.184334348187102e-06, + "loss": 0.0793, + "step": 47315 + }, + { + "epoch": 4.63, + "learning_rate": 3.180182673678384e-06, + "loss": 0.0854, + "step": 47320 + }, + { + "epoch": 4.63, + "learning_rate": 3.1760309991696654e-06, + "loss": 0.0978, + "step": 47325 + }, + { + "epoch": 4.63, + "learning_rate": 3.1718793246609466e-06, + "loss": 0.0905, + "step": 47330 + }, + { + "epoch": 4.63, + "learning_rate": 3.167727650152228e-06, + "loss": 0.0891, + "step": 47335 + }, + { + "epoch": 4.63, + "learning_rate": 3.1635759756435094e-06, + "loss": 0.0782, + "step": 47340 + }, + { + "epoch": 4.63, + "learning_rate": 3.159424301134791e-06, + "loss": 0.1005, + "step": 47345 + }, + { + "epoch": 4.63, + "learning_rate": 3.1552726266260727e-06, + "loss": 0.0829, + "step": 47350 + }, + { + "epoch": 4.63, + "learning_rate": 3.1511209521173543e-06, + "loss": 0.0909, + "step": 47355 + }, + { + "epoch": 4.63, + "learning_rate": 3.1469692776086355e-06, + "loss": 0.1067, + "step": 47360 + }, + { + "epoch": 4.63, + "learning_rate": 3.142817603099917e-06, + "loss": 0.1029, + "step": 47365 + }, + { + "epoch": 4.63, + "learning_rate": 3.1386659285911987e-06, + "loss": 0.0806, + "step": 47370 + }, + { + "epoch": 4.63, + "learning_rate": 3.1345142540824803e-06, + "loss": 0.0922, + "step": 47375 + }, + { + "epoch": 4.63, + "learning_rate": 3.1303625795737615e-06, + "loss": 0.0962, + "step": 47380 + }, + { + "epoch": 4.63, + "learning_rate": 3.1262109050650427e-06, + "loss": 0.0819, + "step": 47385 + }, + { + "epoch": 4.63, + "learning_rate": 3.1220592305563243e-06, + "loss": 0.0855, + "step": 47390 + }, + { + "epoch": 4.63, + "learning_rate": 3.117907556047606e-06, + "loss": 0.1059, + "step": 47395 + }, + { + "epoch": 4.63, + "learning_rate": 3.1137558815388875e-06, + "loss": 0.0874, + "step": 47400 + }, + { + "epoch": 4.64, + "learning_rate": 3.1096042070301687e-06, + "loss": 0.0869, + "step": 47405 + }, + { + "epoch": 4.64, + "learning_rate": 3.1054525325214503e-06, + "loss": 0.1101, + "step": 47410 + }, + { + "epoch": 4.64, + "learning_rate": 3.101300858012732e-06, + "loss": 0.0914, + "step": 47415 + }, + { + "epoch": 4.64, + "learning_rate": 3.0971491835040136e-06, + "loss": 0.0875, + "step": 47420 + }, + { + "epoch": 4.64, + "learning_rate": 3.092997508995295e-06, + "loss": 0.0902, + "step": 47425 + }, + { + "epoch": 4.64, + "learning_rate": 3.0888458344865764e-06, + "loss": 0.0885, + "step": 47430 + }, + { + "epoch": 4.64, + "learning_rate": 3.0846941599778576e-06, + "loss": 0.0782, + "step": 47435 + }, + { + "epoch": 4.64, + "learning_rate": 3.080542485469139e-06, + "loss": 0.0826, + "step": 47440 + }, + { + "epoch": 4.64, + "learning_rate": 3.076390810960421e-06, + "loss": 0.0981, + "step": 47445 + }, + { + "epoch": 4.64, + "learning_rate": 3.072239136451702e-06, + "loss": 0.0805, + "step": 47450 + }, + { + "epoch": 4.64, + "learning_rate": 3.0680874619429836e-06, + "loss": 0.0775, + "step": 47455 + }, + { + "epoch": 4.64, + "learning_rate": 3.0639357874342652e-06, + "loss": 0.0948, + "step": 47460 + }, + { + "epoch": 4.64, + "learning_rate": 3.059784112925547e-06, + "loss": 0.0826, + "step": 47465 + }, + { + "epoch": 4.64, + "learning_rate": 3.0556324384168285e-06, + "loss": 0.0783, + "step": 47470 + }, + { + "epoch": 4.64, + "learning_rate": 3.0514807639081097e-06, + "loss": 0.0947, + "step": 47475 + }, + { + "epoch": 4.64, + "learning_rate": 3.0473290893993913e-06, + "loss": 0.087, + "step": 47480 + }, + { + "epoch": 4.64, + "learning_rate": 3.043177414890673e-06, + "loss": 0.087, + "step": 47485 + }, + { + "epoch": 4.64, + "learning_rate": 3.039025740381954e-06, + "loss": 0.0814, + "step": 47490 + }, + { + "epoch": 4.64, + "learning_rate": 3.0348740658732353e-06, + "loss": 0.1086, + "step": 47495 + }, + { + "epoch": 4.64, + "learning_rate": 3.030722391364517e-06, + "loss": 0.0794, + "step": 47500 + }, + { + "epoch": 4.64, + "eval_cer": 0.052934185182359046, + "eval_loss": 0.21984922885894775, + "eval_runtime": 337.5131, + "eval_samples_per_second": 48.502, + "eval_steps_per_second": 1.348, + "eval_wer": 0.13588606727045963, + "step": 47500 + }, + { + "epoch": 4.65, + "learning_rate": 3.0265707168557985e-06, + "loss": 0.0889, + "step": 47505 + }, + { + "epoch": 4.65, + "learning_rate": 3.02241904234708e-06, + "loss": 0.0991, + "step": 47510 + }, + { + "epoch": 4.65, + "learning_rate": 3.0182673678383617e-06, + "loss": 0.0858, + "step": 47515 + }, + { + "epoch": 4.65, + "learning_rate": 3.014115693329643e-06, + "loss": 0.0859, + "step": 47520 + }, + { + "epoch": 4.65, + "learning_rate": 3.0099640188209245e-06, + "loss": 0.1057, + "step": 47525 + }, + { + "epoch": 4.65, + "learning_rate": 3.005812344312206e-06, + "loss": 0.1005, + "step": 47530 + }, + { + "epoch": 4.65, + "learning_rate": 3.0016606698034878e-06, + "loss": 0.08, + "step": 47535 + }, + { + "epoch": 4.65, + "learning_rate": 2.997508995294769e-06, + "loss": 0.0955, + "step": 47540 + }, + { + "epoch": 4.65, + "learning_rate": 2.99335732078605e-06, + "loss": 0.1013, + "step": 47545 + }, + { + "epoch": 4.65, + "learning_rate": 2.9892056462773318e-06, + "loss": 0.0912, + "step": 47550 + }, + { + "epoch": 4.65, + "learning_rate": 2.9850539717686134e-06, + "loss": 0.0891, + "step": 47555 + }, + { + "epoch": 4.65, + "learning_rate": 2.980902297259895e-06, + "loss": 0.1069, + "step": 47560 + }, + { + "epoch": 4.65, + "learning_rate": 2.976750622751176e-06, + "loss": 0.0914, + "step": 47565 + }, + { + "epoch": 4.65, + "learning_rate": 2.972598948242458e-06, + "loss": 0.0725, + "step": 47570 + }, + { + "epoch": 4.65, + "learning_rate": 2.9684472737337394e-06, + "loss": 0.094, + "step": 47575 + }, + { + "epoch": 4.65, + "learning_rate": 2.964295599225021e-06, + "loss": 0.0917, + "step": 47580 + }, + { + "epoch": 4.65, + "learning_rate": 2.9601439247163022e-06, + "loss": 0.0879, + "step": 47585 + }, + { + "epoch": 4.65, + "learning_rate": 2.955992250207584e-06, + "loss": 0.0922, + "step": 47590 + }, + { + "epoch": 4.65, + "learning_rate": 2.9518405756988655e-06, + "loss": 0.1057, + "step": 47595 + }, + { + "epoch": 4.65, + "learning_rate": 2.9476889011901467e-06, + "loss": 0.0754, + "step": 47600 + }, + { + "epoch": 4.65, + "learning_rate": 2.9435372266814283e-06, + "loss": 0.0886, + "step": 47605 + }, + { + "epoch": 4.66, + "learning_rate": 2.9393855521727095e-06, + "loss": 0.103, + "step": 47610 + }, + { + "epoch": 4.66, + "learning_rate": 2.935233877663991e-06, + "loss": 0.0877, + "step": 47615 + }, + { + "epoch": 4.66, + "learning_rate": 2.9310822031552727e-06, + "loss": 0.0744, + "step": 47620 + }, + { + "epoch": 4.66, + "learning_rate": 2.9269305286465543e-06, + "loss": 0.091, + "step": 47625 + }, + { + "epoch": 4.66, + "learning_rate": 2.922778854137836e-06, + "loss": 0.0902, + "step": 47630 + }, + { + "epoch": 4.66, + "learning_rate": 2.918627179629117e-06, + "loss": 0.0745, + "step": 47635 + }, + { + "epoch": 4.66, + "learning_rate": 2.9144755051203987e-06, + "loss": 0.0868, + "step": 47640 + }, + { + "epoch": 4.66, + "learning_rate": 2.9103238306116803e-06, + "loss": 0.1096, + "step": 47645 + }, + { + "epoch": 4.66, + "learning_rate": 2.906172156102962e-06, + "loss": 0.0775, + "step": 47650 + }, + { + "epoch": 4.66, + "learning_rate": 2.9020204815942427e-06, + "loss": 0.0797, + "step": 47655 + }, + { + "epoch": 4.66, + "learning_rate": 2.8978688070855243e-06, + "loss": 0.1193, + "step": 47660 + }, + { + "epoch": 4.66, + "learning_rate": 2.893717132576806e-06, + "loss": 0.1085, + "step": 47665 + }, + { + "epoch": 4.66, + "learning_rate": 2.8895654580680876e-06, + "loss": 0.0754, + "step": 47670 + }, + { + "epoch": 4.66, + "learning_rate": 2.885413783559369e-06, + "loss": 0.0881, + "step": 47675 + }, + { + "epoch": 4.66, + "learning_rate": 2.8812621090506504e-06, + "loss": 0.0887, + "step": 47680 + }, + { + "epoch": 4.66, + "learning_rate": 2.877110434541932e-06, + "loss": 0.0883, + "step": 47685 + }, + { + "epoch": 4.66, + "learning_rate": 2.8729587600332136e-06, + "loss": 0.1019, + "step": 47690 + }, + { + "epoch": 4.66, + "learning_rate": 2.8688070855244952e-06, + "loss": 0.1181, + "step": 47695 + }, + { + "epoch": 4.66, + "learning_rate": 2.8646554110157764e-06, + "loss": 0.0844, + "step": 47700 + }, + { + "epoch": 4.66, + "learning_rate": 2.860503736507058e-06, + "loss": 0.0866, + "step": 47705 + }, + { + "epoch": 4.67, + "learning_rate": 2.8563520619983392e-06, + "loss": 0.0904, + "step": 47710 + }, + { + "epoch": 4.67, + "learning_rate": 2.852200387489621e-06, + "loss": 0.0802, + "step": 47715 + }, + { + "epoch": 4.67, + "learning_rate": 2.8480487129809025e-06, + "loss": 0.0811, + "step": 47720 + }, + { + "epoch": 4.67, + "learning_rate": 2.8438970384721836e-06, + "loss": 0.0975, + "step": 47725 + }, + { + "epoch": 4.67, + "learning_rate": 2.8397453639634653e-06, + "loss": 0.095, + "step": 47730 + }, + { + "epoch": 4.67, + "learning_rate": 2.835593689454747e-06, + "loss": 0.0839, + "step": 47735 + }, + { + "epoch": 4.67, + "learning_rate": 2.8314420149460285e-06, + "loss": 0.0778, + "step": 47740 + }, + { + "epoch": 4.67, + "learning_rate": 2.8272903404373097e-06, + "loss": 0.1022, + "step": 47745 + }, + { + "epoch": 4.67, + "learning_rate": 2.8231386659285913e-06, + "loss": 0.0866, + "step": 47750 + }, + { + "epoch": 4.67, + "learning_rate": 2.818986991419873e-06, + "loss": 0.0889, + "step": 47755 + }, + { + "epoch": 4.67, + "learning_rate": 2.814835316911154e-06, + "loss": 0.1211, + "step": 47760 + }, + { + "epoch": 4.67, + "learning_rate": 2.8106836424024357e-06, + "loss": 0.0891, + "step": 47765 + }, + { + "epoch": 4.67, + "learning_rate": 2.806531967893717e-06, + "loss": 0.0974, + "step": 47770 + }, + { + "epoch": 4.67, + "learning_rate": 2.8023802933849985e-06, + "loss": 0.1041, + "step": 47775 + }, + { + "epoch": 4.67, + "learning_rate": 2.79822861887628e-06, + "loss": 0.0879, + "step": 47780 + }, + { + "epoch": 4.67, + "learning_rate": 2.7940769443675618e-06, + "loss": 0.0692, + "step": 47785 + }, + { + "epoch": 4.67, + "learning_rate": 2.789925269858843e-06, + "loss": 0.0801, + "step": 47790 + }, + { + "epoch": 4.67, + "learning_rate": 2.7857735953501246e-06, + "loss": 0.0966, + "step": 47795 + }, + { + "epoch": 4.67, + "learning_rate": 2.781621920841406e-06, + "loss": 0.0871, + "step": 47800 + }, + { + "epoch": 4.67, + "learning_rate": 2.777470246332688e-06, + "loss": 0.0997, + "step": 47805 + }, + { + "epoch": 4.68, + "learning_rate": 2.7733185718239694e-06, + "loss": 0.0979, + "step": 47810 + }, + { + "epoch": 4.68, + "learning_rate": 2.76916689731525e-06, + "loss": 0.0841, + "step": 47815 + }, + { + "epoch": 4.68, + "learning_rate": 2.765015222806532e-06, + "loss": 0.0884, + "step": 47820 + }, + { + "epoch": 4.68, + "learning_rate": 2.7608635482978134e-06, + "loss": 0.0935, + "step": 47825 + }, + { + "epoch": 4.68, + "learning_rate": 2.756711873789095e-06, + "loss": 0.0818, + "step": 47830 + }, + { + "epoch": 4.68, + "learning_rate": 2.7525601992803766e-06, + "loss": 0.0812, + "step": 47835 + }, + { + "epoch": 4.68, + "learning_rate": 2.748408524771658e-06, + "loss": 0.0769, + "step": 47840 + }, + { + "epoch": 4.68, + "learning_rate": 2.7442568502629395e-06, + "loss": 0.1098, + "step": 47845 + }, + { + "epoch": 4.68, + "learning_rate": 2.740105175754221e-06, + "loss": 0.079, + "step": 47850 + }, + { + "epoch": 4.68, + "learning_rate": 2.7359535012455027e-06, + "loss": 0.0823, + "step": 47855 + }, + { + "epoch": 4.68, + "learning_rate": 2.731801826736784e-06, + "loss": 0.0965, + "step": 47860 + }, + { + "epoch": 4.68, + "learning_rate": 2.7276501522280655e-06, + "loss": 0.0817, + "step": 47865 + }, + { + "epoch": 4.68, + "learning_rate": 2.7234984777193467e-06, + "loss": 0.0878, + "step": 47870 + }, + { + "epoch": 4.68, + "learning_rate": 2.7193468032106283e-06, + "loss": 0.1112, + "step": 47875 + }, + { + "epoch": 4.68, + "learning_rate": 2.71519512870191e-06, + "loss": 0.1006, + "step": 47880 + }, + { + "epoch": 4.68, + "learning_rate": 2.711043454193191e-06, + "loss": 0.0929, + "step": 47885 + }, + { + "epoch": 4.68, + "learning_rate": 2.7068917796844727e-06, + "loss": 0.0788, + "step": 47890 + }, + { + "epoch": 4.68, + "learning_rate": 2.7027401051757543e-06, + "loss": 0.1154, + "step": 47895 + }, + { + "epoch": 4.68, + "learning_rate": 2.698588430667036e-06, + "loss": 0.0908, + "step": 47900 + }, + { + "epoch": 4.68, + "learning_rate": 2.694436756158317e-06, + "loss": 0.0706, + "step": 47905 + }, + { + "epoch": 4.68, + "learning_rate": 2.6902850816495988e-06, + "loss": 0.0895, + "step": 47910 + }, + { + "epoch": 4.69, + "learning_rate": 2.6861334071408804e-06, + "loss": 0.088, + "step": 47915 + }, + { + "epoch": 4.69, + "learning_rate": 2.681981732632162e-06, + "loss": 0.0737, + "step": 47920 + }, + { + "epoch": 4.69, + "learning_rate": 2.677830058123443e-06, + "loss": 0.111, + "step": 47925 + }, + { + "epoch": 4.69, + "learning_rate": 2.6736783836147244e-06, + "loss": 0.083, + "step": 47930 + }, + { + "epoch": 4.69, + "learning_rate": 2.669526709106006e-06, + "loss": 0.0875, + "step": 47935 + }, + { + "epoch": 4.69, + "learning_rate": 2.6653750345972876e-06, + "loss": 0.0784, + "step": 47940 + }, + { + "epoch": 4.69, + "learning_rate": 2.6612233600885692e-06, + "loss": 0.1128, + "step": 47945 + }, + { + "epoch": 4.69, + "learning_rate": 2.6570716855798504e-06, + "loss": 0.0761, + "step": 47950 + }, + { + "epoch": 4.69, + "learning_rate": 2.652920011071132e-06, + "loss": 0.073, + "step": 47955 + }, + { + "epoch": 4.69, + "learning_rate": 2.6487683365624136e-06, + "loss": 0.0928, + "step": 47960 + }, + { + "epoch": 4.69, + "learning_rate": 2.6446166620536953e-06, + "loss": 0.0757, + "step": 47965 + }, + { + "epoch": 4.69, + "learning_rate": 2.640464987544977e-06, + "loss": 0.0771, + "step": 47970 + }, + { + "epoch": 4.69, + "learning_rate": 2.636313313036258e-06, + "loss": 0.0908, + "step": 47975 + }, + { + "epoch": 4.69, + "learning_rate": 2.6321616385275393e-06, + "loss": 0.0934, + "step": 47980 + }, + { + "epoch": 4.69, + "learning_rate": 2.628009964018821e-06, + "loss": 0.0789, + "step": 47985 + }, + { + "epoch": 4.69, + "learning_rate": 2.6238582895101025e-06, + "loss": 0.0761, + "step": 47990 + }, + { + "epoch": 4.69, + "learning_rate": 2.6197066150013837e-06, + "loss": 0.096, + "step": 47995 + }, + { + "epoch": 4.69, + "learning_rate": 2.6155549404926653e-06, + "loss": 0.0823, + "step": 48000 + }, + { + "epoch": 4.69, + "eval_cer": 0.05266711525165849, + "eval_loss": 0.21994511783123016, + "eval_runtime": 290.3046, + "eval_samples_per_second": 56.389, + "eval_steps_per_second": 1.567, + "eval_wer": 0.13544203783391992, + "step": 48000 + }, + { + "epoch": 4.69, + "learning_rate": 2.611403265983947e-06, + "loss": 0.0718, + "step": 48005 + }, + { + "epoch": 4.69, + "learning_rate": 2.6072515914752285e-06, + "loss": 0.104, + "step": 48010 + }, + { + "epoch": 4.7, + "learning_rate": 2.60309991696651e-06, + "loss": 0.0833, + "step": 48015 + }, + { + "epoch": 4.7, + "learning_rate": 2.5989482424577913e-06, + "loss": 0.092, + "step": 48020 + }, + { + "epoch": 4.7, + "learning_rate": 2.594796567949073e-06, + "loss": 0.0917, + "step": 48025 + }, + { + "epoch": 4.7, + "learning_rate": 2.5906448934403546e-06, + "loss": 0.0886, + "step": 48030 + }, + { + "epoch": 4.7, + "learning_rate": 2.5864932189316358e-06, + "loss": 0.0843, + "step": 48035 + }, + { + "epoch": 4.7, + "learning_rate": 2.5823415444229174e-06, + "loss": 0.0751, + "step": 48040 + }, + { + "epoch": 4.7, + "learning_rate": 2.5781898699141986e-06, + "loss": 0.1029, + "step": 48045 + }, + { + "epoch": 4.7, + "learning_rate": 2.57403819540548e-06, + "loss": 0.0949, + "step": 48050 + }, + { + "epoch": 4.7, + "learning_rate": 2.569886520896762e-06, + "loss": 0.0685, + "step": 48055 + }, + { + "epoch": 4.7, + "learning_rate": 2.5657348463880434e-06, + "loss": 0.1212, + "step": 48060 + }, + { + "epoch": 4.7, + "learning_rate": 2.5615831718793246e-06, + "loss": 0.0819, + "step": 48065 + }, + { + "epoch": 4.7, + "learning_rate": 2.5574314973706062e-06, + "loss": 0.0738, + "step": 48070 + }, + { + "epoch": 4.7, + "learning_rate": 2.553279822861888e-06, + "loss": 0.1001, + "step": 48075 + }, + { + "epoch": 4.7, + "learning_rate": 2.5491281483531694e-06, + "loss": 0.089, + "step": 48080 + }, + { + "epoch": 4.7, + "learning_rate": 2.5449764738444506e-06, + "loss": 0.0742, + "step": 48085 + }, + { + "epoch": 4.7, + "learning_rate": 2.540824799335732e-06, + "loss": 0.0813, + "step": 48090 + }, + { + "epoch": 4.7, + "learning_rate": 2.5366731248270134e-06, + "loss": 0.096, + "step": 48095 + }, + { + "epoch": 4.7, + "learning_rate": 2.532521450318295e-06, + "loss": 0.0871, + "step": 48100 + }, + { + "epoch": 4.7, + "learning_rate": 2.5283697758095767e-06, + "loss": 0.0724, + "step": 48105 + }, + { + "epoch": 4.7, + "learning_rate": 2.524218101300858e-06, + "loss": 0.1061, + "step": 48110 + }, + { + "epoch": 4.7, + "learning_rate": 2.5200664267921395e-06, + "loss": 0.1075, + "step": 48115 + }, + { + "epoch": 4.71, + "learning_rate": 2.515914752283421e-06, + "loss": 0.0844, + "step": 48120 + }, + { + "epoch": 4.71, + "learning_rate": 2.5117630777747027e-06, + "loss": 0.0941, + "step": 48125 + }, + { + "epoch": 4.71, + "learning_rate": 2.5076114032659843e-06, + "loss": 0.0955, + "step": 48130 + }, + { + "epoch": 4.71, + "learning_rate": 2.5034597287572655e-06, + "loss": 0.082, + "step": 48135 + }, + { + "epoch": 4.71, + "learning_rate": 2.4993080542485467e-06, + "loss": 0.0821, + "step": 48140 + }, + { + "epoch": 4.71, + "learning_rate": 2.4951563797398283e-06, + "loss": 0.1042, + "step": 48145 + }, + { + "epoch": 4.71, + "learning_rate": 2.49100470523111e-06, + "loss": 0.0866, + "step": 48150 + }, + { + "epoch": 4.71, + "learning_rate": 2.486853030722391e-06, + "loss": 0.0872, + "step": 48155 + }, + { + "epoch": 4.71, + "learning_rate": 2.4827013562136728e-06, + "loss": 0.103, + "step": 48160 + }, + { + "epoch": 4.71, + "learning_rate": 2.4785496817049544e-06, + "loss": 0.0874, + "step": 48165 + }, + { + "epoch": 4.71, + "learning_rate": 2.474398007196236e-06, + "loss": 0.0747, + "step": 48170 + }, + { + "epoch": 4.71, + "learning_rate": 2.4702463326875176e-06, + "loss": 0.0987, + "step": 48175 + }, + { + "epoch": 4.71, + "learning_rate": 2.466094658178799e-06, + "loss": 0.0934, + "step": 48180 + }, + { + "epoch": 4.71, + "learning_rate": 2.4619429836700804e-06, + "loss": 0.0766, + "step": 48185 + }, + { + "epoch": 4.71, + "learning_rate": 2.457791309161362e-06, + "loss": 0.0899, + "step": 48190 + }, + { + "epoch": 4.71, + "learning_rate": 2.4536396346526432e-06, + "loss": 0.096, + "step": 48195 + }, + { + "epoch": 4.71, + "learning_rate": 2.449487960143925e-06, + "loss": 0.079, + "step": 48200 + }, + { + "epoch": 4.71, + "learning_rate": 2.445336285635206e-06, + "loss": 0.0861, + "step": 48205 + }, + { + "epoch": 4.71, + "learning_rate": 2.4411846111264876e-06, + "loss": 0.1161, + "step": 48210 + }, + { + "epoch": 4.71, + "learning_rate": 2.4370329366177693e-06, + "loss": 0.0882, + "step": 48215 + }, + { + "epoch": 4.72, + "learning_rate": 2.432881262109051e-06, + "loss": 0.0792, + "step": 48220 + }, + { + "epoch": 4.72, + "learning_rate": 2.428729587600332e-06, + "loss": 0.0972, + "step": 48225 + }, + { + "epoch": 4.72, + "learning_rate": 2.4245779130916137e-06, + "loss": 0.1016, + "step": 48230 + }, + { + "epoch": 4.72, + "learning_rate": 2.4204262385828953e-06, + "loss": 0.0976, + "step": 48235 + }, + { + "epoch": 4.72, + "learning_rate": 2.416274564074177e-06, + "loss": 0.0903, + "step": 48240 + }, + { + "epoch": 4.72, + "learning_rate": 2.4121228895654585e-06, + "loss": 0.0978, + "step": 48245 + }, + { + "epoch": 4.72, + "learning_rate": 2.4079712150567393e-06, + "loss": 0.0789, + "step": 48250 + }, + { + "epoch": 4.72, + "learning_rate": 2.403819540548021e-06, + "loss": 0.0796, + "step": 48255 + }, + { + "epoch": 4.72, + "learning_rate": 2.3996678660393025e-06, + "loss": 0.1118, + "step": 48260 + }, + { + "epoch": 4.72, + "learning_rate": 2.395516191530584e-06, + "loss": 0.0816, + "step": 48265 + }, + { + "epoch": 4.72, + "learning_rate": 2.3913645170218653e-06, + "loss": 0.0747, + "step": 48270 + }, + { + "epoch": 4.72, + "learning_rate": 2.387212842513147e-06, + "loss": 0.0905, + "step": 48275 + }, + { + "epoch": 4.72, + "learning_rate": 2.3830611680044286e-06, + "loss": 0.0846, + "step": 48280 + }, + { + "epoch": 4.72, + "learning_rate": 2.37890949349571e-06, + "loss": 0.0862, + "step": 48285 + }, + { + "epoch": 4.72, + "learning_rate": 2.374757818986992e-06, + "loss": 0.0884, + "step": 48290 + }, + { + "epoch": 4.72, + "learning_rate": 2.370606144478273e-06, + "loss": 0.1021, + "step": 48295 + }, + { + "epoch": 4.72, + "learning_rate": 2.3664544699695546e-06, + "loss": 0.0851, + "step": 48300 + }, + { + "epoch": 4.72, + "learning_rate": 2.362302795460836e-06, + "loss": 0.0795, + "step": 48305 + }, + { + "epoch": 4.72, + "learning_rate": 2.3581511209521174e-06, + "loss": 0.1142, + "step": 48310 + }, + { + "epoch": 4.72, + "learning_rate": 2.3539994464433986e-06, + "loss": 0.0778, + "step": 48315 + }, + { + "epoch": 4.72, + "learning_rate": 2.3498477719346802e-06, + "loss": 0.0953, + "step": 48320 + }, + { + "epoch": 4.73, + "learning_rate": 2.345696097425962e-06, + "loss": 0.1006, + "step": 48325 + }, + { + "epoch": 4.73, + "learning_rate": 2.3415444229172434e-06, + "loss": 0.0864, + "step": 48330 + }, + { + "epoch": 4.73, + "learning_rate": 2.337392748408525e-06, + "loss": 0.0902, + "step": 48335 + }, + { + "epoch": 4.73, + "learning_rate": 2.3332410738998063e-06, + "loss": 0.0843, + "step": 48340 + }, + { + "epoch": 4.73, + "learning_rate": 2.329089399391088e-06, + "loss": 0.1008, + "step": 48345 + }, + { + "epoch": 4.73, + "learning_rate": 2.3249377248823695e-06, + "loss": 0.0752, + "step": 48350 + }, + { + "epoch": 4.73, + "learning_rate": 2.320786050373651e-06, + "loss": 0.093, + "step": 48355 + }, + { + "epoch": 4.73, + "learning_rate": 2.316634375864932e-06, + "loss": 0.1157, + "step": 48360 + }, + { + "epoch": 4.73, + "learning_rate": 2.3124827013562135e-06, + "loss": 0.0904, + "step": 48365 + }, + { + "epoch": 4.73, + "learning_rate": 2.308331026847495e-06, + "loss": 0.074, + "step": 48370 + }, + { + "epoch": 4.73, + "learning_rate": 2.3041793523387767e-06, + "loss": 0.1096, + "step": 48375 + }, + { + "epoch": 4.73, + "learning_rate": 2.3000276778300583e-06, + "loss": 0.099, + "step": 48380 + }, + { + "epoch": 4.73, + "learning_rate": 2.2958760033213395e-06, + "loss": 0.0772, + "step": 48385 + }, + { + "epoch": 4.73, + "learning_rate": 2.291724328812621e-06, + "loss": 0.0876, + "step": 48390 + }, + { + "epoch": 4.73, + "learning_rate": 2.2875726543039028e-06, + "loss": 0.0923, + "step": 48395 + }, + { + "epoch": 4.73, + "learning_rate": 2.2834209797951844e-06, + "loss": 0.098, + "step": 48400 + }, + { + "epoch": 4.73, + "learning_rate": 2.2792693052864656e-06, + "loss": 0.0893, + "step": 48405 + }, + { + "epoch": 4.73, + "learning_rate": 2.275117630777747e-06, + "loss": 0.1131, + "step": 48410 + }, + { + "epoch": 4.73, + "learning_rate": 2.2709659562690284e-06, + "loss": 0.0955, + "step": 48415 + }, + { + "epoch": 4.73, + "learning_rate": 2.26681428176031e-06, + "loss": 0.0758, + "step": 48420 + }, + { + "epoch": 4.74, + "learning_rate": 2.2626626072515916e-06, + "loss": 0.092, + "step": 48425 + }, + { + "epoch": 4.74, + "learning_rate": 2.2585109327428728e-06, + "loss": 0.0846, + "step": 48430 + }, + { + "epoch": 4.74, + "learning_rate": 2.2543592582341544e-06, + "loss": 0.0882, + "step": 48435 + }, + { + "epoch": 4.74, + "learning_rate": 2.250207583725436e-06, + "loss": 0.105, + "step": 48440 + }, + { + "epoch": 4.74, + "learning_rate": 2.2460559092167176e-06, + "loss": 0.0971, + "step": 48445 + }, + { + "epoch": 4.74, + "learning_rate": 2.2419042347079992e-06, + "loss": 0.0848, + "step": 48450 + }, + { + "epoch": 4.74, + "learning_rate": 2.2377525601992804e-06, + "loss": 0.071, + "step": 48455 + }, + { + "epoch": 4.74, + "learning_rate": 2.233600885690562e-06, + "loss": 0.1126, + "step": 48460 + }, + { + "epoch": 4.74, + "learning_rate": 2.2294492111818432e-06, + "loss": 0.0947, + "step": 48465 + }, + { + "epoch": 4.74, + "learning_rate": 2.225297536673125e-06, + "loss": 0.0814, + "step": 48470 + }, + { + "epoch": 4.74, + "learning_rate": 2.221145862164406e-06, + "loss": 0.0856, + "step": 48475 + }, + { + "epoch": 4.74, + "learning_rate": 2.2169941876556877e-06, + "loss": 0.0853, + "step": 48480 + }, + { + "epoch": 4.74, + "learning_rate": 2.2128425131469693e-06, + "loss": 0.0752, + "step": 48485 + }, + { + "epoch": 4.74, + "learning_rate": 2.208690838638251e-06, + "loss": 0.0868, + "step": 48490 + }, + { + "epoch": 4.74, + "learning_rate": 2.2045391641295325e-06, + "loss": 0.105, + "step": 48495 + }, + { + "epoch": 4.74, + "learning_rate": 2.2003874896208137e-06, + "loss": 0.0849, + "step": 48500 + }, + { + "epoch": 4.74, + "eval_cer": 0.05253993909418204, + "eval_loss": 0.2175559103488922, + "eval_runtime": 274.3676, + "eval_samples_per_second": 59.664, + "eval_steps_per_second": 1.658, + "eval_wer": 0.13477599367911036, + "step": 48500 + }, + { + "epoch": 4.74, + "learning_rate": 2.1962358151120953e-06, + "loss": 0.0759, + "step": 48505 + }, + { + "epoch": 4.74, + "learning_rate": 2.192084140603377e-06, + "loss": 0.1015, + "step": 48510 + }, + { + "epoch": 4.74, + "learning_rate": 2.1879324660946586e-06, + "loss": 0.0847, + "step": 48515 + }, + { + "epoch": 4.74, + "learning_rate": 2.1837807915859393e-06, + "loss": 0.0756, + "step": 48520 + }, + { + "epoch": 4.74, + "learning_rate": 2.179629117077221e-06, + "loss": 0.0929, + "step": 48525 + }, + { + "epoch": 4.75, + "learning_rate": 2.1754774425685026e-06, + "loss": 0.1016, + "step": 48530 + }, + { + "epoch": 4.75, + "learning_rate": 2.171325768059784e-06, + "loss": 0.086, + "step": 48535 + }, + { + "epoch": 4.75, + "learning_rate": 2.1671740935510658e-06, + "loss": 0.1129, + "step": 48540 + }, + { + "epoch": 4.75, + "learning_rate": 2.163022419042347e-06, + "loss": 0.1048, + "step": 48545 + }, + { + "epoch": 4.75, + "learning_rate": 2.1588707445336286e-06, + "loss": 0.0821, + "step": 48550 + }, + { + "epoch": 4.75, + "learning_rate": 2.15471907002491e-06, + "loss": 0.0767, + "step": 48555 + }, + { + "epoch": 4.75, + "learning_rate": 2.150567395516192e-06, + "loss": 0.1087, + "step": 48560 + }, + { + "epoch": 4.75, + "learning_rate": 2.146415721007473e-06, + "loss": 0.0869, + "step": 48565 + }, + { + "epoch": 4.75, + "learning_rate": 2.1422640464987546e-06, + "loss": 0.0771, + "step": 48570 + }, + { + "epoch": 4.75, + "learning_rate": 2.138112371990036e-06, + "loss": 0.1017, + "step": 48575 + }, + { + "epoch": 4.75, + "learning_rate": 2.1339606974813174e-06, + "loss": 0.0934, + "step": 48580 + }, + { + "epoch": 4.75, + "learning_rate": 2.129809022972599e-06, + "loss": 0.0866, + "step": 48585 + }, + { + "epoch": 4.75, + "learning_rate": 2.1256573484638802e-06, + "loss": 0.0773, + "step": 48590 + }, + { + "epoch": 4.75, + "learning_rate": 2.121505673955162e-06, + "loss": 0.0998, + "step": 48595 + }, + { + "epoch": 4.75, + "learning_rate": 2.1173539994464435e-06, + "loss": 0.0848, + "step": 48600 + }, + { + "epoch": 4.75, + "learning_rate": 2.113202324937725e-06, + "loss": 0.0771, + "step": 48605 + }, + { + "epoch": 4.75, + "learning_rate": 2.1090506504290063e-06, + "loss": 0.1122, + "step": 48610 + }, + { + "epoch": 4.75, + "learning_rate": 2.104898975920288e-06, + "loss": 0.0925, + "step": 48615 + }, + { + "epoch": 4.75, + "learning_rate": 2.1007473014115695e-06, + "loss": 0.0812, + "step": 48620 + }, + { + "epoch": 4.75, + "learning_rate": 2.096595626902851e-06, + "loss": 0.0933, + "step": 48625 + }, + { + "epoch": 4.76, + "learning_rate": 2.0924439523941323e-06, + "loss": 0.0781, + "step": 48630 + }, + { + "epoch": 4.76, + "learning_rate": 2.0882922778854135e-06, + "loss": 0.077, + "step": 48635 + }, + { + "epoch": 4.76, + "learning_rate": 2.084140603376695e-06, + "loss": 0.0916, + "step": 48640 + }, + { + "epoch": 4.76, + "learning_rate": 2.0799889288679767e-06, + "loss": 0.111, + "step": 48645 + }, + { + "epoch": 4.76, + "learning_rate": 2.0758372543592584e-06, + "loss": 0.0769, + "step": 48650 + }, + { + "epoch": 4.76, + "learning_rate": 2.07168557985054e-06, + "loss": 0.0779, + "step": 48655 + }, + { + "epoch": 4.76, + "learning_rate": 2.067533905341821e-06, + "loss": 0.0998, + "step": 48660 + }, + { + "epoch": 4.76, + "learning_rate": 2.0633822308331028e-06, + "loss": 0.092, + "step": 48665 + }, + { + "epoch": 4.76, + "learning_rate": 2.0592305563243844e-06, + "loss": 0.0814, + "step": 48670 + }, + { + "epoch": 4.76, + "learning_rate": 2.055078881815666e-06, + "loss": 0.0991, + "step": 48675 + }, + { + "epoch": 4.76, + "learning_rate": 2.050927207306947e-06, + "loss": 0.0766, + "step": 48680 + }, + { + "epoch": 4.76, + "learning_rate": 2.0467755327982284e-06, + "loss": 0.0817, + "step": 48685 + }, + { + "epoch": 4.76, + "learning_rate": 2.04262385828951e-06, + "loss": 0.083, + "step": 48690 + }, + { + "epoch": 4.76, + "learning_rate": 2.0384721837807916e-06, + "loss": 0.1051, + "step": 48695 + }, + { + "epoch": 4.76, + "learning_rate": 2.0343205092720732e-06, + "loss": 0.0807, + "step": 48700 + }, + { + "epoch": 4.76, + "learning_rate": 2.0301688347633544e-06, + "loss": 0.0827, + "step": 48705 + }, + { + "epoch": 4.76, + "learning_rate": 2.026017160254636e-06, + "loss": 0.1103, + "step": 48710 + }, + { + "epoch": 4.76, + "learning_rate": 2.0218654857459177e-06, + "loss": 0.0866, + "step": 48715 + }, + { + "epoch": 4.76, + "learning_rate": 2.0177138112371993e-06, + "loss": 0.0799, + "step": 48720 + }, + { + "epoch": 4.76, + "learning_rate": 2.0135621367284805e-06, + "loss": 0.0905, + "step": 48725 + }, + { + "epoch": 4.76, + "learning_rate": 2.009410462219762e-06, + "loss": 0.0846, + "step": 48730 + }, + { + "epoch": 4.77, + "learning_rate": 2.0052587877110437e-06, + "loss": 0.078, + "step": 48735 + }, + { + "epoch": 4.77, + "learning_rate": 2.001107113202325e-06, + "loss": 0.0843, + "step": 48740 + }, + { + "epoch": 4.77, + "learning_rate": 1.9969554386936065e-06, + "loss": 0.0988, + "step": 48745 + }, + { + "epoch": 4.77, + "learning_rate": 1.9928037641848877e-06, + "loss": 0.0801, + "step": 48750 + }, + { + "epoch": 4.77, + "learning_rate": 1.9886520896761693e-06, + "loss": 0.0855, + "step": 48755 + }, + { + "epoch": 4.77, + "learning_rate": 1.984500415167451e-06, + "loss": 0.1045, + "step": 48760 + }, + { + "epoch": 4.77, + "learning_rate": 1.9803487406587326e-06, + "loss": 0.0844, + "step": 48765 + }, + { + "epoch": 4.77, + "learning_rate": 1.9761970661500137e-06, + "loss": 0.0908, + "step": 48770 + }, + { + "epoch": 4.77, + "learning_rate": 1.9720453916412954e-06, + "loss": 0.088, + "step": 48775 + }, + { + "epoch": 4.77, + "learning_rate": 1.967893717132577e-06, + "loss": 0.1045, + "step": 48780 + }, + { + "epoch": 4.77, + "learning_rate": 1.9637420426238586e-06, + "loss": 0.0787, + "step": 48785 + }, + { + "epoch": 4.77, + "learning_rate": 1.95959036811514e-06, + "loss": 0.0825, + "step": 48790 + }, + { + "epoch": 4.77, + "learning_rate": 1.955438693606421e-06, + "loss": 0.1165, + "step": 48795 + }, + { + "epoch": 4.77, + "learning_rate": 1.9512870190977026e-06, + "loss": 0.0883, + "step": 48800 + }, + { + "epoch": 4.77, + "learning_rate": 1.947135344588984e-06, + "loss": 0.0815, + "step": 48805 + }, + { + "epoch": 4.77, + "learning_rate": 1.942983670080266e-06, + "loss": 0.1017, + "step": 48810 + }, + { + "epoch": 4.77, + "learning_rate": 1.939662330473291e-06, + "loss": 0.0991, + "step": 48815 + }, + { + "epoch": 4.77, + "learning_rate": 1.9355106559645725e-06, + "loss": 0.0824, + "step": 48820 + }, + { + "epoch": 4.77, + "learning_rate": 1.931358981455854e-06, + "loss": 0.1018, + "step": 48825 + }, + { + "epoch": 4.77, + "learning_rate": 1.9272073069471353e-06, + "loss": 0.1008, + "step": 48830 + }, + { + "epoch": 4.78, + "learning_rate": 1.923055632438417e-06, + "loss": 0.0766, + "step": 48835 + }, + { + "epoch": 4.78, + "learning_rate": 1.9189039579296985e-06, + "loss": 0.0813, + "step": 48840 + }, + { + "epoch": 4.78, + "learning_rate": 1.91475228342098e-06, + "loss": 0.1138, + "step": 48845 + }, + { + "epoch": 4.78, + "learning_rate": 1.9106006089122613e-06, + "loss": 0.0818, + "step": 48850 + }, + { + "epoch": 4.78, + "learning_rate": 1.9064489344035427e-06, + "loss": 0.0819, + "step": 48855 + }, + { + "epoch": 4.78, + "learning_rate": 1.9022972598948241e-06, + "loss": 0.0985, + "step": 48860 + }, + { + "epoch": 4.78, + "learning_rate": 1.8981455853861057e-06, + "loss": 0.09, + "step": 48865 + }, + { + "epoch": 4.78, + "learning_rate": 1.8939939108773871e-06, + "loss": 0.0751, + "step": 48870 + }, + { + "epoch": 4.78, + "learning_rate": 1.8898422363686688e-06, + "loss": 0.1125, + "step": 48875 + }, + { + "epoch": 4.78, + "learning_rate": 1.8856905618599504e-06, + "loss": 0.0953, + "step": 48880 + }, + { + "epoch": 4.78, + "learning_rate": 1.8815388873512318e-06, + "loss": 0.0917, + "step": 48885 + }, + { + "epoch": 4.78, + "learning_rate": 1.8773872128425134e-06, + "loss": 0.0877, + "step": 48890 + }, + { + "epoch": 4.78, + "learning_rate": 1.8732355383337946e-06, + "loss": 0.0973, + "step": 48895 + }, + { + "epoch": 4.78, + "learning_rate": 1.8690838638250762e-06, + "loss": 0.0936, + "step": 48900 + }, + { + "epoch": 4.78, + "learning_rate": 1.8649321893163576e-06, + "loss": 0.0858, + "step": 48905 + }, + { + "epoch": 4.78, + "learning_rate": 1.8607805148076392e-06, + "loss": 0.0974, + "step": 48910 + }, + { + "epoch": 4.78, + "learning_rate": 1.8566288402989206e-06, + "loss": 0.077, + "step": 48915 + }, + { + "epoch": 4.78, + "learning_rate": 1.852477165790202e-06, + "loss": 0.0766, + "step": 48920 + }, + { + "epoch": 4.78, + "learning_rate": 1.8483254912814836e-06, + "loss": 0.1057, + "step": 48925 + }, + { + "epoch": 4.78, + "learning_rate": 1.844173816772765e-06, + "loss": 0.1045, + "step": 48930 + }, + { + "epoch": 4.79, + "learning_rate": 1.8400221422640467e-06, + "loss": 0.0836, + "step": 48935 + }, + { + "epoch": 4.79, + "learning_rate": 1.835870467755328e-06, + "loss": 0.0776, + "step": 48940 + }, + { + "epoch": 4.79, + "learning_rate": 1.8317187932466095e-06, + "loss": 0.1078, + "step": 48945 + }, + { + "epoch": 4.79, + "learning_rate": 1.8275671187378909e-06, + "loss": 0.0886, + "step": 48950 + }, + { + "epoch": 4.79, + "learning_rate": 1.8234154442291725e-06, + "loss": 0.0875, + "step": 48955 + }, + { + "epoch": 4.79, + "learning_rate": 1.819263769720454e-06, + "loss": 0.1078, + "step": 48960 + }, + { + "epoch": 4.79, + "learning_rate": 1.8151120952117355e-06, + "loss": 0.091, + "step": 48965 + }, + { + "epoch": 4.79, + "learning_rate": 1.810960420703017e-06, + "loss": 0.0849, + "step": 48970 + }, + { + "epoch": 4.79, + "learning_rate": 1.8068087461942983e-06, + "loss": 0.0947, + "step": 48975 + }, + { + "epoch": 4.79, + "learning_rate": 1.80265707168558e-06, + "loss": 0.092, + "step": 48980 + }, + { + "epoch": 4.79, + "learning_rate": 1.7985053971768613e-06, + "loss": 0.0745, + "step": 48985 + }, + { + "epoch": 4.79, + "learning_rate": 1.794353722668143e-06, + "loss": 0.0833, + "step": 48990 + }, + { + "epoch": 4.79, + "learning_rate": 1.7902020481594241e-06, + "loss": 0.0994, + "step": 48995 + }, + { + "epoch": 4.79, + "learning_rate": 1.7860503736507058e-06, + "loss": 0.095, + "step": 49000 + }, + { + "epoch": 4.79, + "eval_cer": 0.05287290939739312, + "eval_loss": 0.21845518052577972, + "eval_runtime": 280.174, + "eval_samples_per_second": 58.428, + "eval_steps_per_second": 1.624, + "eval_wer": 0.13540938861064494, + "step": 49000 + }, + { + "epoch": 4.79, + "learning_rate": 1.7818986991419874e-06, + "loss": 0.0886, + "step": 49005 + }, + { + "epoch": 4.79, + "learning_rate": 1.7777470246332688e-06, + "loss": 0.0973, + "step": 49010 + }, + { + "epoch": 4.79, + "learning_rate": 1.7735953501245504e-06, + "loss": 0.0797, + "step": 49015 + }, + { + "epoch": 4.79, + "learning_rate": 1.7694436756158318e-06, + "loss": 0.0838, + "step": 49020 + }, + { + "epoch": 4.79, + "learning_rate": 1.7652920011071132e-06, + "loss": 0.1042, + "step": 49025 + }, + { + "epoch": 4.79, + "learning_rate": 1.7611403265983946e-06, + "loss": 0.0962, + "step": 49030 + }, + { + "epoch": 4.79, + "learning_rate": 1.7569886520896762e-06, + "loss": 0.087, + "step": 49035 + }, + { + "epoch": 4.8, + "learning_rate": 1.7528369775809578e-06, + "loss": 0.0758, + "step": 49040 + }, + { + "epoch": 4.8, + "learning_rate": 1.7486853030722392e-06, + "loss": 0.1079, + "step": 49045 + }, + { + "epoch": 4.8, + "learning_rate": 1.7445336285635206e-06, + "loss": 0.0806, + "step": 49050 + }, + { + "epoch": 4.8, + "learning_rate": 1.740381954054802e-06, + "loss": 0.0821, + "step": 49055 + }, + { + "epoch": 4.8, + "learning_rate": 1.7362302795460837e-06, + "loss": 0.1083, + "step": 49060 + }, + { + "epoch": 4.8, + "learning_rate": 1.732078605037365e-06, + "loss": 0.0952, + "step": 49065 + }, + { + "epoch": 4.8, + "learning_rate": 1.7279269305286467e-06, + "loss": 0.0804, + "step": 49070 + }, + { + "epoch": 4.8, + "learning_rate": 1.723775256019928e-06, + "loss": 0.0936, + "step": 49075 + }, + { + "epoch": 4.8, + "learning_rate": 1.7196235815112095e-06, + "loss": 0.0896, + "step": 49080 + }, + { + "epoch": 4.8, + "learning_rate": 1.715471907002491e-06, + "loss": 0.0728, + "step": 49085 + }, + { + "epoch": 4.8, + "learning_rate": 1.7113202324937725e-06, + "loss": 0.0969, + "step": 49090 + }, + { + "epoch": 4.8, + "learning_rate": 1.7071685579850541e-06, + "loss": 0.0905, + "step": 49095 + }, + { + "epoch": 4.8, + "learning_rate": 1.7030168834763355e-06, + "loss": 0.0728, + "step": 49100 + }, + { + "epoch": 4.8, + "learning_rate": 1.698865208967617e-06, + "loss": 0.0983, + "step": 49105 + }, + { + "epoch": 4.8, + "learning_rate": 1.6947135344588983e-06, + "loss": 0.0957, + "step": 49110 + }, + { + "epoch": 4.8, + "learning_rate": 1.69056185995018e-06, + "loss": 0.0819, + "step": 49115 + }, + { + "epoch": 4.8, + "learning_rate": 1.6864101854414616e-06, + "loss": 0.0719, + "step": 49120 + }, + { + "epoch": 4.8, + "learning_rate": 1.682258510932743e-06, + "loss": 0.1047, + "step": 49125 + }, + { + "epoch": 4.8, + "learning_rate": 1.6781068364240246e-06, + "loss": 0.0852, + "step": 49130 + }, + { + "epoch": 4.8, + "learning_rate": 1.6739551619153058e-06, + "loss": 0.0742, + "step": 49135 + }, + { + "epoch": 4.81, + "learning_rate": 1.6698034874065874e-06, + "loss": 0.1011, + "step": 49140 + }, + { + "epoch": 4.81, + "learning_rate": 1.6656518128978688e-06, + "loss": 0.0971, + "step": 49145 + }, + { + "epoch": 4.81, + "learning_rate": 1.6615001383891504e-06, + "loss": 0.0899, + "step": 49150 + }, + { + "epoch": 4.81, + "learning_rate": 1.6573484638804318e-06, + "loss": 0.1041, + "step": 49155 + }, + { + "epoch": 4.81, + "learning_rate": 1.6531967893717132e-06, + "loss": 0.0982, + "step": 49160 + }, + { + "epoch": 4.81, + "learning_rate": 1.6490451148629948e-06, + "loss": 0.081, + "step": 49165 + }, + { + "epoch": 4.81, + "learning_rate": 1.6448934403542762e-06, + "loss": 0.0814, + "step": 49170 + }, + { + "epoch": 4.81, + "learning_rate": 1.6407417658455578e-06, + "loss": 0.1031, + "step": 49175 + }, + { + "epoch": 4.81, + "learning_rate": 1.6365900913368393e-06, + "loss": 0.0899, + "step": 49180 + }, + { + "epoch": 4.81, + "learning_rate": 1.6324384168281207e-06, + "loss": 0.0933, + "step": 49185 + }, + { + "epoch": 4.81, + "learning_rate": 1.628286742319402e-06, + "loss": 0.0836, + "step": 49190 + }, + { + "epoch": 4.81, + "learning_rate": 1.6241350678106837e-06, + "loss": 0.1079, + "step": 49195 + }, + { + "epoch": 4.81, + "learning_rate": 1.619983393301965e-06, + "loss": 0.0763, + "step": 49200 + }, + { + "epoch": 4.81, + "learning_rate": 1.6158317187932467e-06, + "loss": 0.0867, + "step": 49205 + }, + { + "epoch": 4.81, + "learning_rate": 1.6116800442845283e-06, + "loss": 0.0892, + "step": 49210 + }, + { + "epoch": 4.81, + "learning_rate": 1.6075283697758095e-06, + "loss": 0.077, + "step": 49215 + }, + { + "epoch": 4.81, + "learning_rate": 1.6033766952670911e-06, + "loss": 0.0766, + "step": 49220 + }, + { + "epoch": 4.81, + "learning_rate": 1.5992250207583725e-06, + "loss": 0.1253, + "step": 49225 + }, + { + "epoch": 4.81, + "learning_rate": 1.5950733462496541e-06, + "loss": 0.096, + "step": 49230 + }, + { + "epoch": 4.81, + "learning_rate": 1.5909216717409355e-06, + "loss": 0.0793, + "step": 49235 + }, + { + "epoch": 4.81, + "learning_rate": 1.586769997232217e-06, + "loss": 0.1016, + "step": 49240 + }, + { + "epoch": 4.82, + "learning_rate": 1.5826183227234986e-06, + "loss": 0.1077, + "step": 49245 + }, + { + "epoch": 4.82, + "learning_rate": 1.57846664821478e-06, + "loss": 0.072, + "step": 49250 + }, + { + "epoch": 4.82, + "learning_rate": 1.5743149737060616e-06, + "loss": 0.0888, + "step": 49255 + }, + { + "epoch": 4.82, + "learning_rate": 1.570163299197343e-06, + "loss": 0.1074, + "step": 49260 + }, + { + "epoch": 4.82, + "learning_rate": 1.5660116246886246e-06, + "loss": 0.0843, + "step": 49265 + }, + { + "epoch": 4.82, + "learning_rate": 1.5618599501799058e-06, + "loss": 0.0761, + "step": 49270 + }, + { + "epoch": 4.82, + "learning_rate": 1.5577082756711874e-06, + "loss": 0.0969, + "step": 49275 + }, + { + "epoch": 4.82, + "learning_rate": 1.5535566011624688e-06, + "loss": 0.0959, + "step": 49280 + }, + { + "epoch": 4.82, + "learning_rate": 1.5494049266537504e-06, + "loss": 0.0819, + "step": 49285 + }, + { + "epoch": 4.82, + "learning_rate": 1.545253252145032e-06, + "loss": 0.0845, + "step": 49290 + }, + { + "epoch": 4.82, + "learning_rate": 1.5411015776363132e-06, + "loss": 0.1041, + "step": 49295 + }, + { + "epoch": 4.82, + "learning_rate": 1.5369499031275948e-06, + "loss": 0.0923, + "step": 49300 + }, + { + "epoch": 4.82, + "learning_rate": 1.5327982286188763e-06, + "loss": 0.0795, + "step": 49305 + }, + { + "epoch": 4.82, + "learning_rate": 1.5286465541101579e-06, + "loss": 0.1116, + "step": 49310 + }, + { + "epoch": 4.82, + "learning_rate": 1.5244948796014393e-06, + "loss": 0.1038, + "step": 49315 + }, + { + "epoch": 4.82, + "learning_rate": 1.5203432050927209e-06, + "loss": 0.083, + "step": 49320 + }, + { + "epoch": 4.82, + "learning_rate": 1.5161915305840023e-06, + "loss": 0.0913, + "step": 49325 + }, + { + "epoch": 4.82, + "learning_rate": 1.5120398560752837e-06, + "loss": 0.0878, + "step": 49330 + }, + { + "epoch": 4.82, + "learning_rate": 1.5078881815665653e-06, + "loss": 0.0651, + "step": 49335 + }, + { + "epoch": 4.82, + "learning_rate": 1.5037365070578467e-06, + "loss": 0.0799, + "step": 49340 + }, + { + "epoch": 4.83, + "learning_rate": 1.4995848325491283e-06, + "loss": 0.1103, + "step": 49345 + }, + { + "epoch": 4.83, + "learning_rate": 1.4954331580404095e-06, + "loss": 0.08, + "step": 49350 + }, + { + "epoch": 4.83, + "learning_rate": 1.4912814835316911e-06, + "loss": 0.0881, + "step": 49355 + }, + { + "epoch": 4.83, + "learning_rate": 1.4871298090229725e-06, + "loss": 0.103, + "step": 49360 + }, + { + "epoch": 4.83, + "learning_rate": 1.4829781345142542e-06, + "loss": 0.0939, + "step": 49365 + }, + { + "epoch": 4.83, + "learning_rate": 1.4788264600055358e-06, + "loss": 0.0796, + "step": 49370 + }, + { + "epoch": 4.83, + "learning_rate": 1.474674785496817e-06, + "loss": 0.096, + "step": 49375 + }, + { + "epoch": 4.83, + "learning_rate": 1.4705231109880986e-06, + "loss": 0.0847, + "step": 49380 + }, + { + "epoch": 4.83, + "learning_rate": 1.46637143647938e-06, + "loss": 0.0951, + "step": 49385 + }, + { + "epoch": 4.83, + "learning_rate": 1.4622197619706616e-06, + "loss": 0.0767, + "step": 49390 + }, + { + "epoch": 4.83, + "learning_rate": 1.458068087461943e-06, + "loss": 0.1163, + "step": 49395 + }, + { + "epoch": 4.83, + "learning_rate": 1.4539164129532246e-06, + "loss": 0.0864, + "step": 49400 + }, + { + "epoch": 4.83, + "learning_rate": 1.4497647384445058e-06, + "loss": 0.0884, + "step": 49405 + }, + { + "epoch": 4.83, + "learning_rate": 1.4456130639357874e-06, + "loss": 0.1075, + "step": 49410 + }, + { + "epoch": 4.83, + "learning_rate": 1.441461389427069e-06, + "loss": 0.0882, + "step": 49415 + }, + { + "epoch": 4.83, + "learning_rate": 1.4373097149183504e-06, + "loss": 0.0719, + "step": 49420 + }, + { + "epoch": 4.83, + "learning_rate": 1.433158040409632e-06, + "loss": 0.1013, + "step": 49425 + }, + { + "epoch": 4.83, + "learning_rate": 1.4290063659009132e-06, + "loss": 0.0838, + "step": 49430 + }, + { + "epoch": 4.83, + "learning_rate": 1.4248546913921949e-06, + "loss": 0.0853, + "step": 49435 + }, + { + "epoch": 4.83, + "learning_rate": 1.4207030168834763e-06, + "loss": 0.0895, + "step": 49440 + }, + { + "epoch": 4.83, + "learning_rate": 1.4165513423747579e-06, + "loss": 0.1007, + "step": 49445 + }, + { + "epoch": 4.84, + "learning_rate": 1.4123996678660395e-06, + "loss": 0.0833, + "step": 49450 + }, + { + "epoch": 4.84, + "learning_rate": 1.408247993357321e-06, + "loss": 0.0807, + "step": 49455 + }, + { + "epoch": 4.84, + "learning_rate": 1.4040963188486023e-06, + "loss": 0.0916, + "step": 49460 + }, + { + "epoch": 4.84, + "learning_rate": 1.3999446443398837e-06, + "loss": 0.077, + "step": 49465 + }, + { + "epoch": 4.84, + "learning_rate": 1.3957929698311653e-06, + "loss": 0.0819, + "step": 49470 + }, + { + "epoch": 4.84, + "learning_rate": 1.3916412953224467e-06, + "loss": 0.1015, + "step": 49475 + }, + { + "epoch": 4.84, + "learning_rate": 1.3874896208137283e-06, + "loss": 0.1046, + "step": 49480 + }, + { + "epoch": 4.84, + "learning_rate": 1.3833379463050095e-06, + "loss": 0.0829, + "step": 49485 + }, + { + "epoch": 4.84, + "learning_rate": 1.3791862717962912e-06, + "loss": 0.0759, + "step": 49490 + }, + { + "epoch": 4.84, + "learning_rate": 1.3750345972875728e-06, + "loss": 0.1161, + "step": 49495 + }, + { + "epoch": 4.84, + "learning_rate": 1.3708829227788542e-06, + "loss": 0.0951, + "step": 49500 + }, + { + "epoch": 4.84, + "eval_cer": 0.05266595910477234, + "eval_loss": 0.21632133424282074, + "eval_runtime": 324.3532, + "eval_samples_per_second": 50.47, + "eval_steps_per_second": 1.403, + "eval_wer": 0.135357149853405, + "step": 49500 + }, + { + "epoch": 4.84, + "learning_rate": 1.3667312482701358e-06, + "loss": 0.0818, + "step": 49505 + }, + { + "epoch": 4.84, + "learning_rate": 1.362579573761417e-06, + "loss": 0.105, + "step": 49510 + }, + { + "epoch": 4.84, + "learning_rate": 1.3584278992526986e-06, + "loss": 0.0909, + "step": 49515 + }, + { + "epoch": 4.84, + "learning_rate": 1.35427622474398e-06, + "loss": 0.0827, + "step": 49520 + }, + { + "epoch": 4.84, + "learning_rate": 1.3501245502352616e-06, + "loss": 0.0867, + "step": 49525 + }, + { + "epoch": 4.84, + "learning_rate": 1.3459728757265432e-06, + "loss": 0.0857, + "step": 49530 + }, + { + "epoch": 4.84, + "learning_rate": 1.3418212012178246e-06, + "loss": 0.0756, + "step": 49535 + }, + { + "epoch": 4.84, + "learning_rate": 1.337669526709106e-06, + "loss": 0.0852, + "step": 49540 + }, + { + "epoch": 4.84, + "learning_rate": 1.3335178522003874e-06, + "loss": 0.1072, + "step": 49545 + }, + { + "epoch": 4.85, + "learning_rate": 1.329366177691669e-06, + "loss": 0.0863, + "step": 49550 + }, + { + "epoch": 4.85, + "learning_rate": 1.3252145031829505e-06, + "loss": 0.0795, + "step": 49555 + }, + { + "epoch": 4.85, + "learning_rate": 1.321062828674232e-06, + "loss": 0.1132, + "step": 49560 + }, + { + "epoch": 4.85, + "learning_rate": 1.3169111541655133e-06, + "loss": 0.0814, + "step": 49565 + }, + { + "epoch": 4.85, + "learning_rate": 1.3127594796567949e-06, + "loss": 0.0967, + "step": 49570 + }, + { + "epoch": 4.85, + "learning_rate": 1.3086078051480765e-06, + "loss": 0.0886, + "step": 49575 + }, + { + "epoch": 4.85, + "learning_rate": 1.304456130639358e-06, + "loss": 0.0936, + "step": 49580 + }, + { + "epoch": 4.85, + "learning_rate": 1.3003044561306395e-06, + "loss": 0.0944, + "step": 49585 + }, + { + "epoch": 4.85, + "learning_rate": 1.296152781621921e-06, + "loss": 0.0835, + "step": 49590 + }, + { + "epoch": 4.85, + "learning_rate": 1.2920011071132023e-06, + "loss": 0.1127, + "step": 49595 + }, + { + "epoch": 4.85, + "learning_rate": 1.2878494326044837e-06, + "loss": 0.0953, + "step": 49600 + }, + { + "epoch": 4.85, + "learning_rate": 1.2836977580957653e-06, + "loss": 0.0813, + "step": 49605 + }, + { + "epoch": 4.85, + "learning_rate": 1.2795460835870467e-06, + "loss": 0.093, + "step": 49610 + }, + { + "epoch": 4.85, + "learning_rate": 1.2753944090783284e-06, + "loss": 0.0915, + "step": 49615 + }, + { + "epoch": 4.85, + "learning_rate": 1.2712427345696098e-06, + "loss": 0.0862, + "step": 49620 + }, + { + "epoch": 4.85, + "learning_rate": 1.2670910600608912e-06, + "loss": 0.0933, + "step": 49625 + }, + { + "epoch": 4.85, + "learning_rate": 1.2629393855521728e-06, + "loss": 0.0921, + "step": 49630 + }, + { + "epoch": 4.85, + "learning_rate": 1.2587877110434542e-06, + "loss": 0.0828, + "step": 49635 + }, + { + "epoch": 4.85, + "learning_rate": 1.2546360365347358e-06, + "loss": 0.0797, + "step": 49640 + }, + { + "epoch": 4.85, + "learning_rate": 1.2504843620260172e-06, + "loss": 0.0883, + "step": 49645 + }, + { + "epoch": 4.85, + "learning_rate": 1.2463326875172986e-06, + "loss": 0.0798, + "step": 49650 + }, + { + "epoch": 4.86, + "learning_rate": 1.2421810130085802e-06, + "loss": 0.0961, + "step": 49655 + }, + { + "epoch": 4.86, + "learning_rate": 1.2380293384998616e-06, + "loss": 0.1028, + "step": 49660 + }, + { + "epoch": 4.86, + "learning_rate": 1.2338776639911432e-06, + "loss": 0.085, + "step": 49665 + }, + { + "epoch": 4.86, + "learning_rate": 1.2297259894824246e-06, + "loss": 0.0771, + "step": 49670 + }, + { + "epoch": 4.86, + "learning_rate": 1.225574314973706e-06, + "loss": 0.1031, + "step": 49675 + }, + { + "epoch": 4.86, + "learning_rate": 1.2214226404649875e-06, + "loss": 0.0942, + "step": 49680 + }, + { + "epoch": 4.86, + "learning_rate": 1.217270965956269e-06, + "loss": 0.0839, + "step": 49685 + }, + { + "epoch": 4.86, + "learning_rate": 1.2131192914475505e-06, + "loss": 0.0941, + "step": 49690 + }, + { + "epoch": 4.86, + "learning_rate": 1.208967616938832e-06, + "loss": 0.0882, + "step": 49695 + }, + { + "epoch": 4.86, + "learning_rate": 1.2048159424301135e-06, + "loss": 0.0831, + "step": 49700 + }, + { + "epoch": 4.86, + "learning_rate": 1.200664267921395e-06, + "loss": 0.0826, + "step": 49705 + }, + { + "epoch": 4.86, + "learning_rate": 1.1965125934126765e-06, + "loss": 0.1029, + "step": 49710 + }, + { + "epoch": 4.86, + "learning_rate": 1.192360918903958e-06, + "loss": 0.0793, + "step": 49715 + }, + { + "epoch": 4.86, + "learning_rate": 1.1882092443952395e-06, + "loss": 0.0762, + "step": 49720 + }, + { + "epoch": 4.86, + "learning_rate": 1.184057569886521e-06, + "loss": 0.0959, + "step": 49725 + }, + { + "epoch": 4.86, + "learning_rate": 1.1799058953778023e-06, + "loss": 0.0953, + "step": 49730 + }, + { + "epoch": 4.86, + "learning_rate": 1.175754220869084e-06, + "loss": 0.0774, + "step": 49735 + }, + { + "epoch": 4.86, + "learning_rate": 1.1716025463603654e-06, + "loss": 0.0925, + "step": 49740 + }, + { + "epoch": 4.86, + "learning_rate": 1.167450871851647e-06, + "loss": 0.0953, + "step": 49745 + }, + { + "epoch": 4.86, + "learning_rate": 1.1632991973429284e-06, + "loss": 0.079, + "step": 49750 + }, + { + "epoch": 4.87, + "learning_rate": 1.1591475228342098e-06, + "loss": 0.0886, + "step": 49755 + }, + { + "epoch": 4.87, + "learning_rate": 1.1549958483254912e-06, + "loss": 0.108, + "step": 49760 + }, + { + "epoch": 4.87, + "learning_rate": 1.1508441738167728e-06, + "loss": 0.0857, + "step": 49765 + }, + { + "epoch": 4.87, + "learning_rate": 1.1466924993080542e-06, + "loss": 0.0894, + "step": 49770 + }, + { + "epoch": 4.87, + "learning_rate": 1.1425408247993358e-06, + "loss": 0.0836, + "step": 49775 + }, + { + "epoch": 4.87, + "learning_rate": 1.1383891502906174e-06, + "loss": 0.0858, + "step": 49780 + }, + { + "epoch": 4.87, + "learning_rate": 1.1342374757818986e-06, + "loss": 0.0821, + "step": 49785 + }, + { + "epoch": 4.87, + "learning_rate": 1.1300858012731802e-06, + "loss": 0.0822, + "step": 49790 + }, + { + "epoch": 4.87, + "learning_rate": 1.1259341267644616e-06, + "loss": 0.1049, + "step": 49795 + }, + { + "epoch": 4.87, + "learning_rate": 1.1217824522557433e-06, + "loss": 0.0859, + "step": 49800 + }, + { + "epoch": 4.87, + "learning_rate": 1.1176307777470247e-06, + "loss": 0.0733, + "step": 49805 + }, + { + "epoch": 4.87, + "learning_rate": 1.113479103238306e-06, + "loss": 0.0951, + "step": 49810 + }, + { + "epoch": 4.87, + "learning_rate": 1.1093274287295875e-06, + "loss": 0.081, + "step": 49815 + }, + { + "epoch": 4.87, + "learning_rate": 1.105175754220869e-06, + "loss": 0.0825, + "step": 49820 + }, + { + "epoch": 4.87, + "learning_rate": 1.1010240797121507e-06, + "loss": 0.1053, + "step": 49825 + }, + { + "epoch": 4.87, + "learning_rate": 1.096872405203432e-06, + "loss": 0.0892, + "step": 49830 + }, + { + "epoch": 4.87, + "learning_rate": 1.0927207306947137e-06, + "loss": 0.0874, + "step": 49835 + }, + { + "epoch": 4.87, + "learning_rate": 1.088569056185995e-06, + "loss": 0.0937, + "step": 49840 + }, + { + "epoch": 4.87, + "learning_rate": 1.0844173816772765e-06, + "loss": 0.1115, + "step": 49845 + }, + { + "epoch": 4.87, + "learning_rate": 1.080265707168558e-06, + "loss": 0.088, + "step": 49850 + }, + { + "epoch": 4.88, + "learning_rate": 1.0761140326598395e-06, + "loss": 0.0875, + "step": 49855 + }, + { + "epoch": 4.88, + "learning_rate": 1.0719623581511212e-06, + "loss": 0.1057, + "step": 49860 + }, + { + "epoch": 4.88, + "learning_rate": 1.0678106836424024e-06, + "loss": 0.0764, + "step": 49865 + }, + { + "epoch": 4.88, + "learning_rate": 1.063659009133684e-06, + "loss": 0.0747, + "step": 49870 + }, + { + "epoch": 4.88, + "learning_rate": 1.0595073346249654e-06, + "loss": 0.0893, + "step": 49875 + }, + { + "epoch": 4.88, + "learning_rate": 1.055355660116247e-06, + "loss": 0.0858, + "step": 49880 + }, + { + "epoch": 4.88, + "learning_rate": 1.0512039856075284e-06, + "loss": 0.0825, + "step": 49885 + }, + { + "epoch": 4.88, + "learning_rate": 1.0470523110988098e-06, + "loss": 0.0825, + "step": 49890 + }, + { + "epoch": 4.88, + "learning_rate": 1.0429006365900912e-06, + "loss": 0.1117, + "step": 49895 + }, + { + "epoch": 4.88, + "learning_rate": 1.0387489620813728e-06, + "loss": 0.0775, + "step": 49900 + }, + { + "epoch": 4.88, + "learning_rate": 1.0345972875726544e-06, + "loss": 0.0851, + "step": 49905 + }, + { + "epoch": 4.88, + "learning_rate": 1.0304456130639358e-06, + "loss": 0.0961, + "step": 49910 + }, + { + "epoch": 4.88, + "learning_rate": 1.0262939385552174e-06, + "loss": 0.0893, + "step": 49915 + }, + { + "epoch": 4.88, + "learning_rate": 1.0221422640464986e-06, + "loss": 0.0878, + "step": 49920 + }, + { + "epoch": 4.88, + "learning_rate": 1.0179905895377803e-06, + "loss": 0.0922, + "step": 49925 + }, + { + "epoch": 4.88, + "learning_rate": 1.0138389150290617e-06, + "loss": 0.0984, + "step": 49930 + }, + { + "epoch": 4.88, + "learning_rate": 1.0096872405203433e-06, + "loss": 0.0811, + "step": 49935 + }, + { + "epoch": 4.88, + "learning_rate": 1.0055355660116249e-06, + "loss": 0.0806, + "step": 49940 + }, + { + "epoch": 4.88, + "learning_rate": 1.001383891502906e-06, + "loss": 0.1051, + "step": 49945 + }, + { + "epoch": 4.88, + "learning_rate": 9.972322169941877e-07, + "loss": 0.0759, + "step": 49950 + }, + { + "epoch": 4.88, + "learning_rate": 9.93080542485469e-07, + "loss": 0.0758, + "step": 49955 + }, + { + "epoch": 4.89, + "learning_rate": 9.889288679767507e-07, + "loss": 0.0968, + "step": 49960 + }, + { + "epoch": 4.89, + "learning_rate": 9.847771934680321e-07, + "loss": 0.0901, + "step": 49965 + }, + { + "epoch": 4.89, + "learning_rate": 9.806255189593137e-07, + "loss": 0.0787, + "step": 49970 + }, + { + "epoch": 4.89, + "learning_rate": 9.76473844450595e-07, + "loss": 0.0988, + "step": 49975 + }, + { + "epoch": 4.89, + "learning_rate": 9.723221699418765e-07, + "loss": 0.1129, + "step": 49980 + }, + { + "epoch": 4.89, + "learning_rate": 9.681704954331582e-07, + "loss": 0.0792, + "step": 49985 + }, + { + "epoch": 4.89, + "learning_rate": 9.640188209244396e-07, + "loss": 0.0705, + "step": 49990 + }, + { + "epoch": 4.89, + "learning_rate": 9.598671464157212e-07, + "loss": 0.1103, + "step": 49995 + }, + { + "epoch": 4.89, + "learning_rate": 9.557154719070024e-07, + "loss": 0.0902, + "step": 50000 + }, + { + "epoch": 4.89, + "eval_cer": 0.052514503862686746, + "eval_loss": 0.21631939709186554, + "eval_runtime": 282.1944, + "eval_samples_per_second": 58.01, + "eval_steps_per_second": 1.612, + "eval_wer": 0.1350241277760002, + "step": 50000 + }, + { + "epoch": 4.89, + "learning_rate": 9.51563797398284e-07, + "loss": 0.0909, + "step": 50005 + }, + { + "epoch": 4.89, + "learning_rate": 9.474121228895655e-07, + "loss": 0.1082, + "step": 50010 + }, + { + "epoch": 4.89, + "learning_rate": 9.43260448380847e-07, + "loss": 0.0771, + "step": 50015 + }, + { + "epoch": 4.89, + "learning_rate": 9.391087738721285e-07, + "loss": 0.0865, + "step": 50020 + }, + { + "epoch": 4.89, + "learning_rate": 9.349570993634099e-07, + "loss": 0.0969, + "step": 50025 + }, + { + "epoch": 4.89, + "learning_rate": 9.308054248546914e-07, + "loss": 0.0955, + "step": 50030 + }, + { + "epoch": 4.89, + "learning_rate": 9.266537503459728e-07, + "loss": 0.0832, + "step": 50035 + }, + { + "epoch": 4.89, + "learning_rate": 9.225020758372543e-07, + "loss": 0.0876, + "step": 50040 + }, + { + "epoch": 4.89, + "learning_rate": 9.18350401328536e-07, + "loss": 0.0983, + "step": 50045 + }, + { + "epoch": 4.89, + "learning_rate": 9.141987268198174e-07, + "loss": 0.0882, + "step": 50050 + }, + { + "epoch": 4.89, + "learning_rate": 9.100470523110989e-07, + "loss": 0.0767, + "step": 50055 + }, + { + "epoch": 4.9, + "learning_rate": 9.058953778023803e-07, + "loss": 0.1175, + "step": 50060 + }, + { + "epoch": 4.9, + "learning_rate": 9.017437032936618e-07, + "loss": 0.09, + "step": 50065 + }, + { + "epoch": 4.9, + "learning_rate": 8.975920287849433e-07, + "loss": 0.0857, + "step": 50070 + }, + { + "epoch": 4.9, + "learning_rate": 8.934403542762247e-07, + "loss": 0.1027, + "step": 50075 + }, + { + "epoch": 4.9, + "learning_rate": 8.892886797675062e-07, + "loss": 0.0914, + "step": 50080 + }, + { + "epoch": 4.9, + "learning_rate": 8.851370052587878e-07, + "loss": 0.0784, + "step": 50085 + }, + { + "epoch": 4.9, + "learning_rate": 8.809853307500692e-07, + "loss": 0.0696, + "step": 50090 + }, + { + "epoch": 4.9, + "learning_rate": 8.768336562413507e-07, + "loss": 0.1027, + "step": 50095 + }, + { + "epoch": 4.9, + "learning_rate": 8.726819817326321e-07, + "loss": 0.085, + "step": 50100 + }, + { + "epoch": 4.9, + "learning_rate": 8.685303072239136e-07, + "loss": 0.0962, + "step": 50105 + }, + { + "epoch": 4.9, + "learning_rate": 8.643786327151952e-07, + "loss": 0.1069, + "step": 50110 + }, + { + "epoch": 4.9, + "learning_rate": 8.602269582064766e-07, + "loss": 0.0947, + "step": 50115 + }, + { + "epoch": 4.9, + "learning_rate": 8.560752836977581e-07, + "loss": 0.0894, + "step": 50120 + }, + { + "epoch": 4.9, + "learning_rate": 8.519236091890397e-07, + "loss": 0.1014, + "step": 50125 + }, + { + "epoch": 4.9, + "learning_rate": 8.477719346803211e-07, + "loss": 0.094, + "step": 50130 + }, + { + "epoch": 4.9, + "learning_rate": 8.436202601716026e-07, + "loss": 0.0709, + "step": 50135 + }, + { + "epoch": 4.9, + "learning_rate": 8.394685856628841e-07, + "loss": 0.0938, + "step": 50140 + }, + { + "epoch": 4.9, + "learning_rate": 8.353169111541655e-07, + "loss": 0.0978, + "step": 50145 + }, + { + "epoch": 4.9, + "learning_rate": 8.31165236645447e-07, + "loss": 0.0811, + "step": 50150 + }, + { + "epoch": 4.9, + "learning_rate": 8.270135621367284e-07, + "loss": 0.0782, + "step": 50155 + }, + { + "epoch": 4.9, + "learning_rate": 8.228618876280099e-07, + "loss": 0.1113, + "step": 50160 + }, + { + "epoch": 4.91, + "learning_rate": 8.187102131192915e-07, + "loss": 0.0829, + "step": 50165 + }, + { + "epoch": 4.91, + "learning_rate": 8.14558538610573e-07, + "loss": 0.0903, + "step": 50170 + }, + { + "epoch": 4.91, + "learning_rate": 8.104068641018545e-07, + "loss": 0.0862, + "step": 50175 + }, + { + "epoch": 4.91, + "learning_rate": 8.06255189593136e-07, + "loss": 0.0924, + "step": 50180 + }, + { + "epoch": 4.91, + "learning_rate": 8.021035150844174e-07, + "loss": 0.0896, + "step": 50185 + }, + { + "epoch": 4.91, + "learning_rate": 7.979518405756989e-07, + "loss": 0.0752, + "step": 50190 + }, + { + "epoch": 4.91, + "learning_rate": 7.938001660669803e-07, + "loss": 0.1027, + "step": 50195 + }, + { + "epoch": 4.91, + "learning_rate": 7.896484915582618e-07, + "loss": 0.0875, + "step": 50200 + }, + { + "epoch": 4.91, + "learning_rate": 7.854968170495434e-07, + "loss": 0.0707, + "step": 50205 + }, + { + "epoch": 4.91, + "learning_rate": 7.813451425408248e-07, + "loss": 0.0952, + "step": 50210 + }, + { + "epoch": 4.91, + "learning_rate": 7.771934680321063e-07, + "loss": 0.0806, + "step": 50215 + }, + { + "epoch": 4.91, + "learning_rate": 7.730417935233878e-07, + "loss": 0.079, + "step": 50220 + }, + { + "epoch": 4.91, + "learning_rate": 7.688901190146692e-07, + "loss": 0.0999, + "step": 50225 + }, + { + "epoch": 4.91, + "learning_rate": 7.647384445059508e-07, + "loss": 0.0913, + "step": 50230 + }, + { + "epoch": 4.91, + "learning_rate": 7.605867699972323e-07, + "loss": 0.0829, + "step": 50235 + }, + { + "epoch": 4.91, + "learning_rate": 7.564350954885137e-07, + "loss": 0.0876, + "step": 50240 + }, + { + "epoch": 4.91, + "learning_rate": 7.522834209797952e-07, + "loss": 0.1113, + "step": 50245 + }, + { + "epoch": 4.91, + "learning_rate": 7.481317464710767e-07, + "loss": 0.0913, + "step": 50250 + }, + { + "epoch": 4.91, + "learning_rate": 7.439800719623582e-07, + "loss": 0.0926, + "step": 50255 + }, + { + "epoch": 4.91, + "learning_rate": 7.398283974536397e-07, + "loss": 0.1037, + "step": 50260 + }, + { + "epoch": 4.92, + "learning_rate": 7.356767229449211e-07, + "loss": 0.0935, + "step": 50265 + }, + { + "epoch": 4.92, + "learning_rate": 7.315250484362026e-07, + "loss": 0.0872, + "step": 50270 + }, + { + "epoch": 4.92, + "learning_rate": 7.273733739274841e-07, + "loss": 0.1004, + "step": 50275 + }, + { + "epoch": 4.92, + "learning_rate": 7.232216994187655e-07, + "loss": 0.0838, + "step": 50280 + }, + { + "epoch": 4.92, + "learning_rate": 7.19070024910047e-07, + "loss": 0.0868, + "step": 50285 + }, + { + "epoch": 4.92, + "learning_rate": 7.149183504013285e-07, + "loss": 0.0802, + "step": 50290 + }, + { + "epoch": 4.92, + "learning_rate": 7.107666758926101e-07, + "loss": 0.0907, + "step": 50295 + }, + { + "epoch": 4.92, + "learning_rate": 7.066150013838916e-07, + "loss": 0.0816, + "step": 50300 + }, + { + "epoch": 4.92, + "learning_rate": 7.02463326875173e-07, + "loss": 0.074, + "step": 50305 + }, + { + "epoch": 4.92, + "learning_rate": 6.983116523664545e-07, + "loss": 0.1107, + "step": 50310 + }, + { + "epoch": 4.92, + "learning_rate": 6.94159977857736e-07, + "loss": 0.0833, + "step": 50315 + }, + { + "epoch": 4.92, + "learning_rate": 6.900083033490174e-07, + "loss": 0.084, + "step": 50320 + }, + { + "epoch": 4.92, + "learning_rate": 6.858566288402989e-07, + "loss": 0.0887, + "step": 50325 + }, + { + "epoch": 4.92, + "learning_rate": 6.817049543315805e-07, + "loss": 0.0909, + "step": 50330 + }, + { + "epoch": 4.92, + "learning_rate": 6.775532798228619e-07, + "loss": 0.0789, + "step": 50335 + }, + { + "epoch": 4.92, + "learning_rate": 6.734016053141434e-07, + "loss": 0.0857, + "step": 50340 + }, + { + "epoch": 4.92, + "learning_rate": 6.692499308054248e-07, + "loss": 0.0908, + "step": 50345 + }, + { + "epoch": 4.92, + "learning_rate": 6.650982562967063e-07, + "loss": 0.0899, + "step": 50350 + }, + { + "epoch": 4.92, + "learning_rate": 6.609465817879879e-07, + "loss": 0.0864, + "step": 50355 + }, + { + "epoch": 4.92, + "learning_rate": 6.567949072792693e-07, + "loss": 0.1061, + "step": 50360 + }, + { + "epoch": 4.92, + "learning_rate": 6.526432327705508e-07, + "loss": 0.0874, + "step": 50365 + }, + { + "epoch": 4.93, + "learning_rate": 6.484915582618324e-07, + "loss": 0.0784, + "step": 50370 + }, + { + "epoch": 4.93, + "learning_rate": 6.443398837531138e-07, + "loss": 0.0865, + "step": 50375 + }, + { + "epoch": 4.93, + "learning_rate": 6.401882092443953e-07, + "loss": 0.1011, + "step": 50380 + }, + { + "epoch": 4.93, + "learning_rate": 6.360365347356767e-07, + "loss": 0.07, + "step": 50385 + }, + { + "epoch": 4.93, + "learning_rate": 6.318848602269582e-07, + "loss": 0.0821, + "step": 50390 + }, + { + "epoch": 4.93, + "learning_rate": 6.277331857182397e-07, + "loss": 0.0967, + "step": 50395 + }, + { + "epoch": 4.93, + "learning_rate": 6.235815112095211e-07, + "loss": 0.0909, + "step": 50400 + }, + { + "epoch": 4.93, + "learning_rate": 6.194298367008026e-07, + "loss": 0.0845, + "step": 50405 + }, + { + "epoch": 4.93, + "learning_rate": 6.152781621920842e-07, + "loss": 0.0985, + "step": 50410 + }, + { + "epoch": 4.93, + "learning_rate": 6.111264876833657e-07, + "loss": 0.0913, + "step": 50415 + }, + { + "epoch": 4.93, + "learning_rate": 6.069748131746472e-07, + "loss": 0.0755, + "step": 50420 + }, + { + "epoch": 4.93, + "learning_rate": 6.028231386659287e-07, + "loss": 0.1072, + "step": 50425 + }, + { + "epoch": 4.93, + "learning_rate": 5.986714641572101e-07, + "loss": 0.094, + "step": 50430 + }, + { + "epoch": 4.93, + "learning_rate": 5.945197896484916e-07, + "loss": 0.0802, + "step": 50435 + }, + { + "epoch": 4.93, + "learning_rate": 5.90368115139773e-07, + "loss": 0.1012, + "step": 50440 + }, + { + "epoch": 4.93, + "learning_rate": 5.862164406310545e-07, + "loss": 0.0885, + "step": 50445 + }, + { + "epoch": 4.93, + "learning_rate": 5.82064766122336e-07, + "loss": 0.0845, + "step": 50450 + }, + { + "epoch": 4.93, + "learning_rate": 5.779130916136175e-07, + "loss": 0.0813, + "step": 50455 + }, + { + "epoch": 4.93, + "learning_rate": 5.73761417104899e-07, + "loss": 0.1012, + "step": 50460 + }, + { + "epoch": 4.93, + "learning_rate": 5.696097425961805e-07, + "loss": 0.076, + "step": 50465 + }, + { + "epoch": 4.94, + "learning_rate": 5.654580680874619e-07, + "loss": 0.0845, + "step": 50470 + }, + { + "epoch": 4.94, + "learning_rate": 5.613063935787434e-07, + "loss": 0.0982, + "step": 50475 + }, + { + "epoch": 4.94, + "learning_rate": 5.571547190700249e-07, + "loss": 0.0942, + "step": 50480 + }, + { + "epoch": 4.94, + "learning_rate": 5.530030445613064e-07, + "loss": 0.0824, + "step": 50485 + }, + { + "epoch": 4.94, + "learning_rate": 5.488513700525879e-07, + "loss": 0.0752, + "step": 50490 + }, + { + "epoch": 4.94, + "learning_rate": 5.446996955438694e-07, + "loss": 0.105, + "step": 50495 + }, + { + "epoch": 4.94, + "learning_rate": 5.405480210351509e-07, + "loss": 0.066, + "step": 50500 + }, + { + "epoch": 4.94, + "eval_cer": 0.05246363339969617, + "eval_loss": 0.2166503667831421, + "eval_runtime": 278.3915, + "eval_samples_per_second": 58.802, + "eval_steps_per_second": 1.634, + "eval_wer": 0.1350371874653102, + "step": 50500 + }, + { + "epoch": 4.94, + "learning_rate": 5.363963465264324e-07, + "loss": 0.0845, + "step": 50505 + }, + { + "epoch": 4.94, + "learning_rate": 5.322446720177138e-07, + "loss": 0.105, + "step": 50510 + }, + { + "epoch": 4.94, + "learning_rate": 5.280929975089953e-07, + "loss": 0.0809, + "step": 50515 + }, + { + "epoch": 4.94, + "learning_rate": 5.239413230002768e-07, + "loss": 0.077, + "step": 50520 + }, + { + "epoch": 4.94, + "learning_rate": 5.197896484915582e-07, + "loss": 0.1099, + "step": 50525 + }, + { + "epoch": 4.94, + "learning_rate": 5.156379739828397e-07, + "loss": 0.1085, + "step": 50530 + }, + { + "epoch": 4.94, + "learning_rate": 5.114862994741212e-07, + "loss": 0.0813, + "step": 50535 + }, + { + "epoch": 4.94, + "learning_rate": 5.073346249654028e-07, + "loss": 0.0867, + "step": 50540 + }, + { + "epoch": 4.94, + "learning_rate": 5.031829504566843e-07, + "loss": 0.0951, + "step": 50545 + }, + { + "epoch": 4.94, + "learning_rate": 4.990312759479657e-07, + "loss": 0.0822, + "step": 50550 + }, + { + "epoch": 4.94, + "learning_rate": 4.948796014392472e-07, + "loss": 0.0841, + "step": 50555 + }, + { + "epoch": 4.94, + "learning_rate": 4.907279269305287e-07, + "loss": 0.0957, + "step": 50560 + }, + { + "epoch": 4.94, + "learning_rate": 4.865762524218101e-07, + "loss": 0.0813, + "step": 50565 + }, + { + "epoch": 4.94, + "learning_rate": 4.824245779130916e-07, + "loss": 0.088, + "step": 50570 + }, + { + "epoch": 4.95, + "learning_rate": 4.782729034043731e-07, + "loss": 0.0898, + "step": 50575 + }, + { + "epoch": 4.95, + "learning_rate": 4.7412122889565456e-07, + "loss": 0.0851, + "step": 50580 + }, + { + "epoch": 4.95, + "learning_rate": 4.6996955438693613e-07, + "loss": 0.0832, + "step": 50585 + }, + { + "epoch": 4.95, + "learning_rate": 4.658178798782176e-07, + "loss": 0.0906, + "step": 50590 + }, + { + "epoch": 4.95, + "learning_rate": 4.6166620536949904e-07, + "loss": 0.1108, + "step": 50595 + }, + { + "epoch": 4.95, + "learning_rate": 4.575145308607805e-07, + "loss": 0.0844, + "step": 50600 + }, + { + "epoch": 4.95, + "learning_rate": 4.5336285635206206e-07, + "loss": 0.0746, + "step": 50605 + }, + { + "epoch": 4.95, + "learning_rate": 4.492111818433435e-07, + "loss": 0.0994, + "step": 50610 + }, + { + "epoch": 4.95, + "learning_rate": 4.4505950733462497e-07, + "loss": 0.0882, + "step": 50615 + }, + { + "epoch": 4.95, + "learning_rate": 4.4090783282590643e-07, + "loss": 0.0734, + "step": 50620 + }, + { + "epoch": 4.95, + "learning_rate": 4.36756158317188e-07, + "loss": 0.0901, + "step": 50625 + }, + { + "epoch": 4.95, + "learning_rate": 4.3260448380846945e-07, + "loss": 0.0918, + "step": 50630 + }, + { + "epoch": 4.95, + "learning_rate": 4.284528092997509e-07, + "loss": 0.0885, + "step": 50635 + }, + { + "epoch": 4.95, + "learning_rate": 4.2430113479103236e-07, + "loss": 0.0837, + "step": 50640 + }, + { + "epoch": 4.95, + "learning_rate": 4.2014946028231387e-07, + "loss": 0.1085, + "step": 50645 + }, + { + "epoch": 4.95, + "learning_rate": 4.159977857735954e-07, + "loss": 0.0789, + "step": 50650 + }, + { + "epoch": 4.95, + "learning_rate": 4.1184611126487684e-07, + "loss": 0.0738, + "step": 50655 + }, + { + "epoch": 4.95, + "learning_rate": 4.076944367561583e-07, + "loss": 0.1012, + "step": 50660 + }, + { + "epoch": 4.95, + "learning_rate": 4.035427622474398e-07, + "loss": 0.0854, + "step": 50665 + }, + { + "epoch": 4.95, + "learning_rate": 3.993910877387213e-07, + "loss": 0.0777, + "step": 50670 + }, + { + "epoch": 4.96, + "learning_rate": 3.9523941323000277e-07, + "loss": 0.1077, + "step": 50675 + }, + { + "epoch": 4.96, + "learning_rate": 3.910877387212842e-07, + "loss": 0.0853, + "step": 50680 + }, + { + "epoch": 4.96, + "learning_rate": 3.8693606421256574e-07, + "loss": 0.0762, + "step": 50685 + }, + { + "epoch": 4.96, + "learning_rate": 3.8278438970384725e-07, + "loss": 0.0833, + "step": 50690 + }, + { + "epoch": 4.96, + "learning_rate": 3.786327151951287e-07, + "loss": 0.1091, + "step": 50695 + }, + { + "epoch": 4.96, + "learning_rate": 3.744810406864102e-07, + "loss": 0.0909, + "step": 50700 + }, + { + "epoch": 4.96, + "learning_rate": 3.7032936617769167e-07, + "loss": 0.0874, + "step": 50705 + }, + { + "epoch": 4.96, + "learning_rate": 3.661776916689732e-07, + "loss": 0.107, + "step": 50710 + }, + { + "epoch": 4.96, + "learning_rate": 3.6202601716025463e-07, + "loss": 0.0798, + "step": 50715 + }, + { + "epoch": 4.96, + "learning_rate": 3.5787434265153614e-07, + "loss": 0.0831, + "step": 50720 + }, + { + "epoch": 4.96, + "learning_rate": 3.537226681428176e-07, + "loss": 0.0942, + "step": 50725 + }, + { + "epoch": 4.96, + "learning_rate": 3.495709936340991e-07, + "loss": 0.0838, + "step": 50730 + }, + { + "epoch": 4.96, + "learning_rate": 3.4541931912538057e-07, + "loss": 0.0821, + "step": 50735 + }, + { + "epoch": 4.96, + "learning_rate": 3.412676446166621e-07, + "loss": 0.0812, + "step": 50740 + }, + { + "epoch": 4.96, + "learning_rate": 3.3711597010794353e-07, + "loss": 0.1065, + "step": 50745 + }, + { + "epoch": 4.96, + "learning_rate": 3.3296429559922504e-07, + "loss": 0.0973, + "step": 50750 + }, + { + "epoch": 4.96, + "learning_rate": 3.288126210905065e-07, + "loss": 0.0799, + "step": 50755 + }, + { + "epoch": 4.96, + "learning_rate": 3.24660946581788e-07, + "loss": 0.1003, + "step": 50760 + }, + { + "epoch": 4.96, + "learning_rate": 3.2050927207306946e-07, + "loss": 0.0752, + "step": 50765 + }, + { + "epoch": 4.96, + "learning_rate": 3.16357597564351e-07, + "loss": 0.0741, + "step": 50770 + }, + { + "epoch": 4.96, + "learning_rate": 3.1220592305563243e-07, + "loss": 0.0989, + "step": 50775 + }, + { + "epoch": 4.97, + "learning_rate": 3.0805424854691394e-07, + "loss": 0.0842, + "step": 50780 + }, + { + "epoch": 4.97, + "learning_rate": 3.039025740381954e-07, + "loss": 0.0758, + "step": 50785 + }, + { + "epoch": 4.97, + "learning_rate": 2.997508995294769e-07, + "loss": 0.0889, + "step": 50790 + }, + { + "epoch": 4.97, + "learning_rate": 2.9559922502075836e-07, + "loss": 0.1008, + "step": 50795 + }, + { + "epoch": 4.97, + "learning_rate": 2.9144755051203987e-07, + "loss": 0.0777, + "step": 50800 + }, + { + "epoch": 4.97, + "learning_rate": 2.8729587600332133e-07, + "loss": 0.0799, + "step": 50805 + }, + { + "epoch": 4.97, + "learning_rate": 2.8314420149460284e-07, + "loss": 0.0939, + "step": 50810 + }, + { + "epoch": 4.97, + "learning_rate": 2.7899252698588435e-07, + "loss": 0.076, + "step": 50815 + }, + { + "epoch": 4.97, + "learning_rate": 2.748408524771658e-07, + "loss": 0.0742, + "step": 50820 + }, + { + "epoch": 4.97, + "learning_rate": 2.7068917796844726e-07, + "loss": 0.0981, + "step": 50825 + }, + { + "epoch": 4.97, + "learning_rate": 2.6653750345972877e-07, + "loss": 0.093, + "step": 50830 + }, + { + "epoch": 4.97, + "learning_rate": 2.623858289510103e-07, + "loss": 0.0684, + "step": 50835 + }, + { + "epoch": 4.97, + "learning_rate": 2.5823415444229174e-07, + "loss": 0.084, + "step": 50840 + }, + { + "epoch": 4.97, + "learning_rate": 2.540824799335732e-07, + "loss": 0.096, + "step": 50845 + }, + { + "epoch": 4.97, + "learning_rate": 2.499308054248547e-07, + "loss": 0.0874, + "step": 50850 + }, + { + "epoch": 4.97, + "learning_rate": 2.457791309161362e-07, + "loss": 0.0905, + "step": 50855 + }, + { + "epoch": 4.97, + "learning_rate": 2.4162745640741767e-07, + "loss": 0.1134, + "step": 50860 + }, + { + "epoch": 4.97, + "learning_rate": 2.3747578189869913e-07, + "loss": 0.0801, + "step": 50865 + }, + { + "epoch": 4.97, + "learning_rate": 2.3332410738998064e-07, + "loss": 0.0794, + "step": 50870 + }, + { + "epoch": 4.97, + "learning_rate": 2.291724328812621e-07, + "loss": 0.0928, + "step": 50875 + }, + { + "epoch": 4.98, + "learning_rate": 2.250207583725436e-07, + "loss": 0.0994, + "step": 50880 + }, + { + "epoch": 4.98, + "learning_rate": 2.2086908386382506e-07, + "loss": 0.08, + "step": 50885 + }, + { + "epoch": 4.98, + "learning_rate": 2.1671740935510657e-07, + "loss": 0.0886, + "step": 50890 + }, + { + "epoch": 4.98, + "learning_rate": 2.1256573484638805e-07, + "loss": 0.0941, + "step": 50895 + }, + { + "epoch": 4.98, + "learning_rate": 2.0841406033766953e-07, + "loss": 0.0893, + "step": 50900 + }, + { + "epoch": 4.98, + "learning_rate": 2.0426238582895102e-07, + "loss": 0.0726, + "step": 50905 + }, + { + "epoch": 4.98, + "learning_rate": 2.001107113202325e-07, + "loss": 0.0956, + "step": 50910 + }, + { + "epoch": 4.98, + "learning_rate": 1.9595903681151398e-07, + "loss": 0.0769, + "step": 50915 + }, + { + "epoch": 4.98, + "learning_rate": 1.9180736230279547e-07, + "loss": 0.0722, + "step": 50920 + }, + { + "epoch": 4.98, + "learning_rate": 1.8765568779407695e-07, + "loss": 0.0853, + "step": 50925 + }, + { + "epoch": 4.98, + "learning_rate": 1.8350401328535843e-07, + "loss": 0.084, + "step": 50930 + }, + { + "epoch": 4.98, + "learning_rate": 1.7935233877663992e-07, + "loss": 0.0861, + "step": 50935 + }, + { + "epoch": 4.98, + "learning_rate": 1.760309991696651e-07, + "loss": 0.092, + "step": 50940 + }, + { + "epoch": 4.98, + "learning_rate": 1.718793246609466e-07, + "loss": 0.1014, + "step": 50945 + }, + { + "epoch": 4.98, + "learning_rate": 1.6772765015222808e-07, + "loss": 0.0822, + "step": 50950 + }, + { + "epoch": 4.98, + "learning_rate": 1.6357597564350956e-07, + "loss": 0.0748, + "step": 50955 + }, + { + "epoch": 4.98, + "learning_rate": 1.5942430113479104e-07, + "loss": 0.1035, + "step": 50960 + }, + { + "epoch": 4.98, + "learning_rate": 1.5527262662607253e-07, + "loss": 0.082, + "step": 50965 + }, + { + "epoch": 4.98, + "learning_rate": 1.51120952117354e-07, + "loss": 0.0868, + "step": 50970 + }, + { + "epoch": 4.98, + "learning_rate": 1.469692776086355e-07, + "loss": 0.0955, + "step": 50975 + }, + { + "epoch": 4.99, + "learning_rate": 1.4281760309991698e-07, + "loss": 0.0984, + "step": 50980 + }, + { + "epoch": 4.99, + "learning_rate": 1.3866592859119843e-07, + "loss": 0.08, + "step": 50985 + }, + { + "epoch": 4.99, + "learning_rate": 1.3451425408247994e-07, + "loss": 0.0865, + "step": 50990 + }, + { + "epoch": 4.99, + "learning_rate": 1.303625795737614e-07, + "loss": 0.0983, + "step": 50995 + }, + { + "epoch": 4.99, + "learning_rate": 1.262109050650429e-07, + "loss": 0.0776, + "step": 51000 + }, + { + "epoch": 4.99, + "eval_cer": 0.052439354315087026, + "eval_loss": 0.21685931086540222, + "eval_runtime": 273.3393, + "eval_samples_per_second": 59.889, + "eval_steps_per_second": 1.665, + "eval_wer": 0.13511554560117015, + "step": 51000 + }, + { + "epoch": 4.99, + "learning_rate": 1.2205923055632437e-07, + "loss": 0.0917, + "step": 51005 + }, + { + "epoch": 4.99, + "learning_rate": 1.1790755604760588e-07, + "loss": 0.1064, + "step": 51010 + }, + { + "epoch": 4.99, + "learning_rate": 1.1375588153888736e-07, + "loss": 0.0961, + "step": 51015 + }, + { + "epoch": 4.99, + "learning_rate": 1.0960420703016884e-07, + "loss": 0.081, + "step": 51020 + }, + { + "epoch": 4.99, + "learning_rate": 1.0545253252145032e-07, + "loss": 0.1067, + "step": 51025 + }, + { + "epoch": 4.99, + "learning_rate": 1.0130085801273181e-07, + "loss": 0.0816, + "step": 51030 + }, + { + "epoch": 4.99, + "learning_rate": 9.714918350401329e-08, + "loss": 0.0828, + "step": 51035 + }, + { + "epoch": 4.99, + "learning_rate": 9.299750899529477e-08, + "loss": 0.0709, + "step": 51040 + }, + { + "epoch": 4.99, + "learning_rate": 8.884583448657626e-08, + "loss": 0.097, + "step": 51045 + }, + { + "epoch": 4.99, + "learning_rate": 8.469415997785774e-08, + "loss": 0.0788, + "step": 51050 + }, + { + "epoch": 4.99, + "learning_rate": 8.054248546913922e-08, + "loss": 0.0754, + "step": 51055 + }, + { + "epoch": 4.99, + "learning_rate": 7.63908109604207e-08, + "loss": 0.108, + "step": 51060 + }, + { + "epoch": 4.99, + "learning_rate": 7.223913645170219e-08, + "loss": 0.0984, + "step": 51065 + }, + { + "epoch": 4.99, + "learning_rate": 6.808746194298367e-08, + "loss": 0.0986, + "step": 51070 + }, + { + "epoch": 4.99, + "learning_rate": 6.393578743426516e-08, + "loss": 0.0879, + "step": 51075 + }, + { + "epoch": 4.99, + "learning_rate": 5.978411292554664e-08, + "loss": 0.0833, + "step": 51080 + }, + { + "epoch": 5.0, + "learning_rate": 5.563243841682812e-08, + "loss": 0.0754, + "step": 51085 + }, + { + "epoch": 5.0, + "learning_rate": 5.1480763908109605e-08, + "loss": 0.0929, + "step": 51090 + }, + { + "epoch": 5.0, + "learning_rate": 4.732908939939109e-08, + "loss": 0.1044, + "step": 51095 + }, + { + "epoch": 5.0, + "learning_rate": 4.317741489067257e-08, + "loss": 0.0749, + "step": 51100 + }, + { + "epoch": 5.0, + "learning_rate": 3.9025740381954054e-08, + "loss": 0.0949, + "step": 51105 + }, + { + "epoch": 5.0, + "learning_rate": 3.4874065873235544e-08, + "loss": 0.1079, + "step": 51110 + }, + { + "epoch": 5.0, + "learning_rate": 3.0722391364517027e-08, + "loss": 0.0746, + "step": 51115 + }, + { + "epoch": 5.0, + "learning_rate": 2.6570716855798506e-08, + "loss": 0.0819, + "step": 51120 + }, + { + "epoch": 5.0, + "learning_rate": 2.241904234707999e-08, + "loss": 0.0982, + "step": 51125 + }, + { + "epoch": 5.0, + "learning_rate": 1.8267367838361473e-08, + "loss": 0.0813, + "step": 51130 + }, + { + "epoch": 5.0, + "step": 51130, + "total_flos": 9.155008453907925e+20, + "train_loss": 0.13587924622752628, + "train_runtime": 175088.5296, + "train_samples_per_second": 31.54, + "train_steps_per_second": 0.292 + } + ], + "logging_steps": 5, + "max_steps": 51130, + "num_input_tokens_seen": 0, + "num_train_epochs": 5, + "save_steps": 1000, + "total_flos": 9.155008453907925e+20, + "train_batch_size": 12, + "trial_name": null, + "trial_params": null +}